diff --git a/404.html b/404.html
index 39544bc..998d81e 100644
--- a/404.html
+++ b/404.html
@@ -23,7 +23,7 @@
 
     <a class="navbar-brand me-2" href="index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -69,7 +69,7 @@
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer>
diff --git a/CODE_OF_CONDUCT.html b/CODE_OF_CONDUCT.html
index bc1d232..aac1682 100644
--- a/CODE_OF_CONDUCT.html
+++ b/CODE_OF_CONDUCT.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -58,7 +58,7 @@
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/CONTRIBUTING.html b/CONTRIBUTING.html
index 551deac..04c0a62 100644
--- a/CONTRIBUTING.html
+++ b/CONTRIBUTING.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -75,7 +75,7 @@ <h2 id="code-of-conduct">Code of Conduct<a class="anchor" aria-label="anchor" hr
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/SUPPORT.html b/SUPPORT.html
index 78012fa..80ed3ad 100644
--- a/SUPPORT.html
+++ b/SUPPORT.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -65,7 +65,7 @@ <h2 id="what-happens-next">What happens next?<a class="anchor" aria-label="ancho
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/articles/doubletrouble_vignette.html b/articles/doubletrouble_vignette.html
index f7f8caa..038df9b 100644
--- a/articles/doubletrouble_vignette.html
+++ b/articles/doubletrouble_vignette.html
@@ -22,7 +22,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -679,7 +679,7 @@ <h3 id="the-full-scheme-ssd-td-pd-rtrd-dtrd-dd">The <em>full</em> scheme (SSD 
 functions).</p>
 <p>Here, we will create a list of <code>TxDb</code> objects from a list
 of <code>GRanges</code> objects using the function
-<code>makeTxDbFromGRanges</code> from <em><a href="https://bioconductor.org/packages/3.20/txdbmaker" class="external-link">txdbmaker</a></em>.
+<code>makeTxDbFromGRanges()</code> from <em><a href="https://bioconductor.org/packages/3.20/txdbmaker" class="external-link">txdbmaker</a></em>.
 Importantly, to create a <code>TxDb</code> from a <code>GRanges</code>,
 the <code>GRanges</code> object must contain genomic coordinates for all
 features, including transcripts, exons, etc. Because of that, we will
@@ -687,53 +687,6 @@ <h3 id="the-full-scheme-ssd-td-pd-rtrd-dtrd-dd">The <em>full</em> scheme (SSD 
 was not processed with <code><a href="https://rdrr.io/pkg/syntenet/man/process_input.html" class="external-link">syntenet::process_input()</a></code>.</p>
 <div class="sourceCode" id="cb11"><pre class="downlit sourceCode r">
 <code class="sourceCode R"><span><span class="kw"><a href="https://rdrr.io/r/base/library.html" class="external-link">library</a></span><span class="op">(</span><span class="va"><a href="https://bioconductor.org/packages/txdbmaker" class="external-link">txdbmaker</a></span><span class="op">)</span></span>
-<span><span class="co">#&gt; Loading required package: BiocGenerics</span></span>
-<span><span class="co">#&gt; </span></span>
-<span><span class="co">#&gt; Attaching package: 'BiocGenerics'</span></span>
-<span><span class="co">#&gt; The following objects are masked from 'package:stats':</span></span>
-<span><span class="co">#&gt; </span></span>
-<span><span class="co">#&gt;     IQR, mad, sd, var, xtabs</span></span>
-<span><span class="co">#&gt; The following objects are masked from 'package:base':</span></span>
-<span><span class="co">#&gt; </span></span>
-<span><span class="co">#&gt;     anyDuplicated, aperm, append, as.data.frame, basename, cbind,</span></span>
-<span><span class="co">#&gt;     colnames, dirname, do.call, duplicated, eval, evalq, Filter, Find,</span></span>
-<span><span class="co">#&gt;     get, grep, grepl, intersect, is.unsorted, lapply, Map, mapply,</span></span>
-<span><span class="co">#&gt;     match, mget, order, paste, pmax, pmax.int, pmin, pmin.int,</span></span>
-<span><span class="co">#&gt;     Position, rank, rbind, Reduce, rownames, sapply, setdiff, table,</span></span>
-<span><span class="co">#&gt;     tapply, union, unique, unsplit, which.max, which.min</span></span>
-<span><span class="co">#&gt; Loading required package: S4Vectors</span></span>
-<span><span class="co">#&gt; Loading required package: stats4</span></span>
-<span><span class="co">#&gt; </span></span>
-<span><span class="co">#&gt; Attaching package: 'S4Vectors'</span></span>
-<span><span class="co">#&gt; The following object is masked from 'package:utils':</span></span>
-<span><span class="co">#&gt; </span></span>
-<span><span class="co">#&gt;     findMatches</span></span>
-<span><span class="co">#&gt; The following objects are masked from 'package:base':</span></span>
-<span><span class="co">#&gt; </span></span>
-<span><span class="co">#&gt;     expand.grid, I, unname</span></span>
-<span><span class="co">#&gt; Loading required package: GenomeInfoDb</span></span>
-<span><span class="co">#&gt; Loading required package: IRanges</span></span>
-<span><span class="co">#&gt; Loading required package: GenomicRanges</span></span>
-<span><span class="co">#&gt; Loading required package: GenomicFeatures</span></span>
-<span><span class="co">#&gt; Loading required package: AnnotationDbi</span></span>
-<span><span class="co">#&gt; Loading required package: Biobase</span></span>
-<span><span class="co">#&gt; Welcome to Bioconductor</span></span>
-<span><span class="co">#&gt; </span></span>
-<span><span class="co">#&gt;     Vignettes contain introductory material; view with</span></span>
-<span><span class="co">#&gt;     'browseVignettes()'. To cite Bioconductor, see</span></span>
-<span><span class="co">#&gt;     'citation("Biobase")', and for packages 'citation("pkgname")'.</span></span>
-<span><span class="co">#&gt; </span></span>
-<span><span class="co">#&gt; Attaching package: 'txdbmaker'</span></span>
-<span><span class="co">#&gt; The following objects are masked from 'package:GenomicFeatures':</span></span>
-<span><span class="co">#&gt; </span></span>
-<span><span class="co">#&gt;     browseUCSCtrack, getChromInfoFromBiomart, makeFDbPackageFromUCSC,</span></span>
-<span><span class="co">#&gt;     makeFeatureDbFromUCSC, makePackageName, makeTxDb,</span></span>
-<span><span class="co">#&gt;     makeTxDbFromBiomart, makeTxDbFromEnsembl, makeTxDbFromGFF,</span></span>
-<span><span class="co">#&gt;     makeTxDbFromGRanges, makeTxDbFromUCSC, makeTxDbPackage,</span></span>
-<span><span class="co">#&gt;     makeTxDbPackageFromBiomart, makeTxDbPackageFromUCSC,</span></span>
-<span><span class="co">#&gt;     supportedMiRBaseBuildValues, supportedUCSCFeatureDbTables,</span></span>
-<span><span class="co">#&gt;     supportedUCSCFeatureDbTracks, supportedUCSCtables,</span></span>
-<span><span class="co">#&gt;     UCSCFeatureDbTableSchema</span></span>
 <span><span class="co"># Create a list of `TxDb` objects from a list of `GRanges` objects</span></span>
 <span><span class="va">txdb_list</span> <span class="op">&lt;-</span> <span class="fu"><a href="https://rdrr.io/pkg/BiocGenerics/man/lapply.html" class="external-link">lapply</a></span><span class="op">(</span><span class="va">yeast_annot</span>, <span class="fu">txdbmaker</span><span class="fu">::</span><span class="va">makeTxDbFromGRanges</span><span class="op">)</span></span>
 <span><span class="va">txdb_list</span></span>
@@ -744,7 +697,7 @@ <h3 id="the-full-scheme-ssd-td-pd-rtrd-dtrd-dd">The <em>full</em> scheme (SSD 
 <span><span class="co">#&gt; # Genome: NA</span></span>
 <span><span class="co">#&gt; # Nb of transcripts: 6631</span></span>
 <span><span class="co">#&gt; # Db created by: txdbmaker package from Bioconductor</span></span>
-<span><span class="co">#&gt; # Creation time: 2024-07-25 09:05:44 +0000 (Thu, 25 Jul 2024)</span></span>
+<span><span class="co">#&gt; # Creation time: 2024-10-02 09:49:23 +0000 (Wed, 02 Oct 2024)</span></span>
 <span><span class="co">#&gt; # txdbmaker version at creation time: 1.1.1</span></span>
 <span><span class="co">#&gt; # RSQLite version at creation time: 2.3.7</span></span>
 <span><span class="co">#&gt; # DBSCHEMAVERSION: 1.2</span></span>
@@ -756,7 +709,7 @@ <h3 id="the-full-scheme-ssd-td-pd-rtrd-dtrd-dd">The <em>full</em> scheme (SSD 
 <span><span class="co">#&gt; # Genome: NA</span></span>
 <span><span class="co">#&gt; # Nb of transcripts: 5389</span></span>
 <span><span class="co">#&gt; # Db created by: txdbmaker package from Bioconductor</span></span>
-<span><span class="co">#&gt; # Creation time: 2024-07-25 09:05:45 +0000 (Thu, 25 Jul 2024)</span></span>
+<span><span class="co">#&gt; # Creation time: 2024-10-02 09:49:23 +0000 (Wed, 02 Oct 2024)</span></span>
 <span><span class="co">#&gt; # txdbmaker version at creation time: 1.1.1</span></span>
 <span><span class="co">#&gt; # RSQLite version at creation time: 2.3.7</span></span>
 <span><span class="co">#&gt; # DBSCHEMAVERSION: 1.2</span></span></code></pre></div>
@@ -912,6 +865,11 @@ <h2 id="calculating-substitution-rates-for-duplicated-gene-pairs">Calculating su
 <span><span class="co">#&gt; 3 Q0070 Q0045 0.296216 0.438575 0.675405   TD</span></span>
 <span><span class="co">#&gt; 4 Q0070 Q0065 0.394617 0.582050 0.677977   TD</span></span>
 <span><span class="co">#&gt; 5 Q0055 Q0050 0.629343 4.257430 0.147822   TD</span></span></code></pre></div>
+<p>Importantly, <code><a href="../reference/pairs2kaks.html">pairs2kaks()</a></code> expects all genes in the gene
+pairs to be present in the CDS, with matching names. Species
+abbreviations in gene pairs (added by <em><a href="https://bioconductor.org/packages/3.20/syntenet" class="external-link">syntenet</a></em>)
+are automatically removed, so you should not add them to the sequence
+names of your CDS.</p>
 </div>
 <div class="section level2">
 <h2 id="identifying-and-visualizing-k_s-peaks">Identifying and visualizing
@@ -958,13 +916,13 @@ <h2 id="identifying-and-visualizing-k_s-peaks">Identifying and visualizing
 <code class="sourceCode R"><span><span class="co"># Load data and inspect it</span></span>
 <span><span class="fu"><a href="https://rdrr.io/r/utils/data.html" class="external-link">data</a></span><span class="op">(</span><span class="va">gmax_ks</span><span class="op">)</span></span>
 <span><span class="fu"><a href="https://rdrr.io/r/utils/head.html" class="external-link">head</a></span><span class="op">(</span><span class="va">gmax_ks</span><span class="op">)</span></span>
-<span><span class="co">#&gt;               dup1            dup2     Ks</span></span>
-<span><span class="co">#&gt; 1  GLYMA_01G000100 GLYMA_15G276800 0.3750</span></span>
-<span><span class="co">#&gt; 3  GLYMA_01G000400 GLYMA_02G312300 0.0453</span></span>
-<span><span class="co">#&gt; 8  GLYMA_01G000600 GLYMA_14G000400 0.1040</span></span>
-<span><span class="co">#&gt; 10 GLYMA_01G000800 GLYMA_03G188200 0.4730</span></span>
-<span><span class="co">#&gt; 11 GLYMA_01G000800 GLYMA_05G115300 1.2300</span></span>
-<span><span class="co">#&gt; 12 GLYMA_01G000800 GLYMA_17G191100 1.6600</span></span>
+<span><span class="co">#&gt;              dup1            dup2     Ks type</span></span>
+<span><span class="co">#&gt; 1 GLYMA_07G035600 GLYMA_16G004800 0.1670   SD</span></span>
+<span><span class="co">#&gt; 2 GLYMA_18G275200 GLYMA_08G252600 0.1070   SD</span></span>
+<span><span class="co">#&gt; 3 GLYMA_09G282200 GLYMA_20G003400 0.0822   SD</span></span>
+<span><span class="co">#&gt; 4 GLYMA_01G166400 GLYMA_11G077000 0.0904   SD</span></span>
+<span><span class="co">#&gt; 5 GLYMA_07G252100 GLYMA_17G022300 0.1400   SD</span></span>
+<span><span class="co">#&gt; 6 GLYMA_05G133100 GLYMA_08G087600 0.0883   SD</span></span>
 <span></span>
 <span><span class="co"># Plot distribution</span></span>
 <span><span class="fu"><a href="../reference/plot_ks_distro.html">plot_ks_distro</a></span><span class="op">(</span><span class="va">gmax_ks</span><span class="op">)</span></span></code></pre></div>
@@ -983,22 +941,22 @@ <h2 id="identifying-and-visualizing-k_s-peaks">Identifying and visualizing
 <span><span class="va">peaks</span> <span class="op">&lt;-</span> <span class="fu"><a href="../reference/find_ks_peaks.html">find_ks_peaks</a></span><span class="op">(</span><span class="va">gmax_ks</span><span class="op">$</span><span class="va">Ks</span>, npeaks <span class="op">=</span> <span class="fu"><a href="https://rdrr.io/r/base/c.html" class="external-link">c</a></span><span class="op">(</span><span class="fl">2</span>, <span class="fl">3</span><span class="op">)</span>, verbose <span class="op">=</span> <span class="cn">TRUE</span><span class="op">)</span></span>
 <span><span class="co">#&gt; Optimal number of peaks: 3</span></span>
 <span><span class="co">#&gt; Bayesian Information Criterion (BIC): </span></span>
-<span><span class="co">#&gt;           E         V</span></span>
-<span><span class="co">#&gt; 2 -86950.26 -67759.43</span></span>
-<span><span class="co">#&gt; 3 -86977.90 -54202.26</span></span>
+<span><span class="co">#&gt;            E         V</span></span>
+<span><span class="co">#&gt; 2 -100166.88 -88545.37</span></span>
+<span><span class="co">#&gt; 3  -90965.45 -75323.66</span></span>
 <span><span class="co">#&gt; </span></span>
 <span><span class="co">#&gt; Top 3 models based on the BIC criterion: </span></span>
-<span><span class="co">#&gt;       V,3       V,2       E,2 </span></span>
-<span><span class="co">#&gt; -54202.26 -67759.43 -86950.26</span></span>
+<span><span class="co">#&gt;       V,3       V,2       E,3 </span></span>
+<span><span class="co">#&gt; -75323.66 -88545.37 -90965.45</span></span>
 <span><span class="fu"><a href="https://rdrr.io/r/base/names.html" class="external-link">names</a></span><span class="op">(</span><span class="va">peaks</span><span class="op">)</span></span>
 <span><span class="co">#&gt; [1] "mean"   "sd"     "lambda" "ks"</span></span>
 <span><span class="fu"><a href="https://rdrr.io/r/utils/str.html" class="external-link">str</a></span><span class="op">(</span><span class="va">peaks</span><span class="op">)</span></span>
 <span><span class="co">#&gt; List of 4</span></span>
-<span><span class="co">#&gt;  $ mean  : Named num [1:3] 0.118 0.531 1.482</span></span>
+<span><span class="co">#&gt;  $ mean  : Named num [1:3] 0.123 0.601 1.596</span></span>
 <span><span class="co">#&gt;   ..- attr(*, "names")= chr [1:3] "1" "2" "3"</span></span>
-<span><span class="co">#&gt;  $ sd    : num [1:3] 0.0549 0.2443 0.3134</span></span>
-<span><span class="co">#&gt;  $ lambda: num [1:3] 0.352 0.433 0.215</span></span>
-<span><span class="co">#&gt;  $ ks    : num [1:71232] 0.375 0.0453 0.104 0.473 1.23 1.66 1.72 0.13 0.0856 1.96 ...</span></span>
+<span><span class="co">#&gt;  $ sd    : num [1:3] 0.0572 0.287 0.2503</span></span>
+<span><span class="co">#&gt;  $ lambda: num [1:3] 0.285 0.44 0.276</span></span>
+<span><span class="co">#&gt;  $ ks    : num [1:68085] 0.167 0.107 0.0822 0.0904 0.14 0.0883 0.107 0.756 0.737 0.0872 ...</span></span>
 <span></span>
 <span><span class="co"># Visualize Ks distribution</span></span>
 <span><span class="fu"><a href="../reference/plot_ks_peaks.html">plot_ks_peaks</a></span><span class="op">(</span><span class="va">peaks</span><span class="op">)</span></span></code></pre></div>
@@ -1065,16 +1023,16 @@ <h2 id="classifying-genes-by-age-groups">Classifying genes by age groups<a class
 <div class="sourceCode" id="cb20"><pre class="downlit sourceCode r">
 <code class="sourceCode R"><span><span class="co"># Gene pairs without age-based classification</span></span>
 <span><span class="fu"><a href="https://rdrr.io/r/utils/head.html" class="external-link">head</a></span><span class="op">(</span><span class="va">gmax_ks</span><span class="op">)</span></span>
-<span><span class="co">#&gt;               dup1            dup2     Ks</span></span>
-<span><span class="co">#&gt; 1  GLYMA_01G000100 GLYMA_15G276800 0.3750</span></span>
-<span><span class="co">#&gt; 3  GLYMA_01G000400 GLYMA_02G312300 0.0453</span></span>
-<span><span class="co">#&gt; 8  GLYMA_01G000600 GLYMA_14G000400 0.1040</span></span>
-<span><span class="co">#&gt; 10 GLYMA_01G000800 GLYMA_03G188200 0.4730</span></span>
-<span><span class="co">#&gt; 11 GLYMA_01G000800 GLYMA_05G115300 1.2300</span></span>
-<span><span class="co">#&gt; 12 GLYMA_01G000800 GLYMA_17G191100 1.6600</span></span>
+<span><span class="co">#&gt;              dup1            dup2     Ks type</span></span>
+<span><span class="co">#&gt; 1 GLYMA_07G035600 GLYMA_16G004800 0.1670   SD</span></span>
+<span><span class="co">#&gt; 2 GLYMA_18G275200 GLYMA_08G252600 0.1070   SD</span></span>
+<span><span class="co">#&gt; 3 GLYMA_09G282200 GLYMA_20G003400 0.0822   SD</span></span>
+<span><span class="co">#&gt; 4 GLYMA_01G166400 GLYMA_11G077000 0.0904   SD</span></span>
+<span><span class="co">#&gt; 5 GLYMA_07G252100 GLYMA_17G022300 0.1400   SD</span></span>
+<span><span class="co">#&gt; 6 GLYMA_05G133100 GLYMA_08G087600 0.0883   SD</span></span>
 <span></span>
 <span><span class="co"># Classify gene pairs by age group</span></span>
-<span><span class="va">pairs_age_group</span> <span class="op">&lt;-</span> <span class="fu"><a href="../reference/split_pairs_by_peak.html">split_pairs_by_peak</a></span><span class="op">(</span><span class="va">gmax_ks</span>, <span class="va">peaks</span><span class="op">)</span></span>
+<span><span class="va">pairs_age_group</span> <span class="op">&lt;-</span> <span class="fu"><a href="../reference/split_pairs_by_peak.html">split_pairs_by_peak</a></span><span class="op">(</span><span class="va">gmax_ks</span><span class="op">[</span>, <span class="fu"><a href="https://rdrr.io/r/base/c.html" class="external-link">c</a></span><span class="op">(</span><span class="fl">1</span>,<span class="fl">2</span>,<span class="fl">3</span><span class="op">)</span><span class="op">]</span>, <span class="va">peaks</span><span class="op">)</span></span>
 <span></span>
 <span><span class="co"># Inspecting the output</span></span>
 <span><span class="fu"><a href="https://rdrr.io/r/base/names.html" class="external-link">names</a></span><span class="op">(</span><span class="va">pairs_age_group</span><span class="op">)</span></span>
@@ -1082,17 +1040,53 @@ <h2 id="classifying-genes-by-age-groups">Classifying genes by age groups<a class
 <span></span>
 <span><span class="co"># Take a look at the classified gene pairs</span></span>
 <span><span class="fu"><a href="https://rdrr.io/r/utils/head.html" class="external-link">head</a></span><span class="op">(</span><span class="va">pairs_age_group</span><span class="op">$</span><span class="va">pairs</span><span class="op">)</span></span>
-<span><span class="co">#&gt;               dup1            dup2     ks peak</span></span>
-<span><span class="co">#&gt; 1  GLYMA_01G000100 GLYMA_15G276800 0.3750    1</span></span>
-<span><span class="co">#&gt; 3  GLYMA_01G000400 GLYMA_02G312300 0.0453    1</span></span>
-<span><span class="co">#&gt; 8  GLYMA_01G000600 GLYMA_14G000400 0.1040    1</span></span>
-<span><span class="co">#&gt; 10 GLYMA_01G000800 GLYMA_03G188200 0.4730    1</span></span>
-<span><span class="co">#&gt; 16 GLYMA_01G001000 GLYMA_08G359900 0.1300    1</span></span>
-<span><span class="co">#&gt; 18 GLYMA_01G001100 GLYMA_08G359700 0.0856    1</span></span>
+<span><span class="co">#&gt;              dup1            dup2     ks peak</span></span>
+<span><span class="co">#&gt; 1 GLYMA_07G035600 GLYMA_16G004800 0.1670    1</span></span>
+<span><span class="co">#&gt; 2 GLYMA_18G275200 GLYMA_08G252600 0.1070    1</span></span>
+<span><span class="co">#&gt; 3 GLYMA_09G282200 GLYMA_20G003400 0.0822    1</span></span>
+<span><span class="co">#&gt; 4 GLYMA_01G166400 GLYMA_11G077000 0.0904    1</span></span>
+<span><span class="co">#&gt; 5 GLYMA_07G252100 GLYMA_17G022300 0.1400    1</span></span>
+<span><span class="co">#&gt; 6 GLYMA_05G133100 GLYMA_08G087600 0.0883    1</span></span>
 <span></span>
 <span><span class="co"># Visualize Ks distro with age boundaries</span></span>
 <span><span class="va">pairs_age_group</span><span class="op">$</span><span class="va">plot</span></span></code></pre></div>
 <p><img src="doubletrouble_vignette_files/figure-html/split_by_peak-1.png" width="700"></p>
+<p>Age groups can also be used to identify SD gene pairs that likely
+originated from whole-genome duplications. The rationale here is that
+segmental duplicates with
+<math display="inline" xmlns="http://www.w3.org/1998/Math/MathML"><semantics><msub><mi>K</mi><mi>s</mi></msub><annotation encoding="application/x-tex">K_s</annotation></semantics></math>
+values near
+<math display="inline" xmlns="http://www.w3.org/1998/Math/MathML"><semantics><msub><mi>K</mi><mi>s</mi></msub><annotation encoding="application/x-tex">K_s</annotation></semantics></math>
+peaks (indicating WGD events) were likely created by such WGDs. By
+similar logic, SD pairs with
+<math display="inline" xmlns="http://www.w3.org/1998/Math/MathML"><semantics><msub><mi>K</mi><mi>s</mi></msub><annotation encoding="application/x-tex">K_s</annotation></semantics></math>
+values that are too distant from
+<math display="inline" xmlns="http://www.w3.org/1998/Math/MathML"><semantics><msub><mi>K</mi><mi>s</mi></msub><annotation encoding="application/x-tex">K_s</annotation></semantics></math>
+peaks (e.g., &gt;2 standard deviations away from the mean) were likely
+created by duplications of large genomic segments, but not duplications
+of the entire genome.</p>
+<p>As an example, to find gene pairs in the soybean genome that likely
+originated from the WGD event shared by all legumes (~58 million
+years ago), you’d need to extract SD pairs in age group 2 using the
+following code:</p>
+<div class="sourceCode" id="cb21"><pre class="downlit sourceCode r">
+<code class="sourceCode R"><span><span class="co"># Get all pairs in age group 2</span></span>
+<span><span class="va">pairs_ag2</span> <span class="op">&lt;-</span> <span class="va">pairs_age_group</span><span class="op">$</span><span class="va">pairs</span><span class="op">[</span><span class="va">pairs_age_group</span><span class="op">$</span><span class="va">pairs</span><span class="op">$</span><span class="va">peak</span> <span class="op">==</span> <span class="fl">2</span>, <span class="fu"><a href="https://rdrr.io/r/base/c.html" class="external-link">c</a></span><span class="op">(</span><span class="fl">1</span>,<span class="fl">2</span><span class="op">)</span><span class="op">]</span></span>
+<span></span>
+<span><span class="co"># Get all SD pairs</span></span>
+<span><span class="va">sd_pairs</span> <span class="op">&lt;-</span> <span class="va">gmax_ks</span><span class="op">[</span><span class="va">gmax_ks</span><span class="op">$</span><span class="va">type</span> <span class="op">==</span> <span class="st">"SD"</span>, <span class="fu"><a href="https://rdrr.io/r/base/c.html" class="external-link">c</a></span><span class="op">(</span><span class="fl">1</span>,<span class="fl">2</span><span class="op">)</span><span class="op">]</span></span>
+<span></span>
+<span><span class="co"># Merge tables</span></span>
+<span><span class="va">pairs_wgd_legumes</span> <span class="op">&lt;-</span> <span class="fu"><a href="https://rdrr.io/pkg/S4Vectors/man/Vector-merge.html" class="external-link">merge</a></span><span class="op">(</span><span class="va">pairs_ag2</span>, <span class="va">sd_pairs</span><span class="op">)</span></span>
+<span></span>
+<span><span class="fu"><a href="https://rdrr.io/r/utils/head.html" class="external-link">head</a></span><span class="op">(</span><span class="va">pairs_wgd_legumes</span><span class="op">)</span></span>
+<span><span class="co">#&gt;              dup1            dup2</span></span>
+<span><span class="co">#&gt; 1 GLYMA_01G001800 GLYMA_07G130700</span></span>
+<span><span class="co">#&gt; 2 GLYMA_01G002100 GLYMA_05G221300</span></span>
+<span><span class="co">#&gt; 3 GLYMA_01G002300 GLYMA_07G130100</span></span>
+<span><span class="co">#&gt; 4 GLYMA_01G002600 GLYMA_07G129700</span></span>
+<span><span class="co">#&gt; 5 GLYMA_01G003500 GLYMA_05G222800</span></span>
+<span><span class="co">#&gt; 6 GLYMA_01G003500 GLYMA_08G029700</span></span></code></pre></div>
 </div>
 <div class="section level2">
 <h2 id="data-visualization">Data visualization<a class="anchor" aria-label="anchor" href="#data-visualization"></a>
@@ -1112,7 +1106,7 @@ <h3 id="visualizing-the-frequency-of-duplicates-per-mode">Visualizing the freque
 demonstrate how this works, we will use an example data set with
 duplicate pairs for 3 fungi species (and substitution rates, which will
 be ignored by <code><a href="../reference/duplicates2counts.html">duplicates2counts()</a></code>).</p>
-<div class="sourceCode" id="cb21"><pre class="downlit sourceCode r">
+<div class="sourceCode" id="cb22"><pre class="downlit sourceCode r">
 <code class="sourceCode R"><span><span class="co"># Load data set with pre-computed duplicates for 3 fungi species</span></span>
 <span><span class="fu"><a href="https://rdrr.io/r/utils/data.html" class="external-link">data</a></span><span class="op">(</span><span class="va">fungi_kaks</span><span class="op">)</span></span>
 <span><span class="fu"><a href="https://rdrr.io/r/base/names.html" class="external-link">names</a></span><span class="op">(</span><span class="va">fungi_kaks</span><span class="op">)</span></span>
@@ -1154,7 +1148,7 @@ <h3 id="visualizing-the-frequency-of-duplicates-per-mode">Visualizing the freque
 duplication type with the function <code><a href="../reference/plot_duplicate_freqs.html">plot_duplicate_freqs()</a></code>.
 You can visualize frequencies in three different ways, as demonstrated
 below.</p>
-<div class="sourceCode" id="cb22"><pre class="downlit sourceCode r">
+<div class="sourceCode" id="cb23"><pre class="downlit sourceCode r">
 <code class="sourceCode R"><span><span class="co"># A) Facets</span></span>
 <span><span class="va">p1</span> <span class="op">&lt;-</span> <span class="fu"><a href="../reference/plot_duplicate_freqs.html">plot_duplicate_freqs</a></span><span class="op">(</span><span class="va">counts_table</span><span class="op">)</span></span>
 <span></span>
@@ -1167,18 +1161,18 @@ <h3 id="visualizing-the-frequency-of-duplicates-per-mode">Visualizing the freque
 <span><span class="co"># Combine plots, one per row</span></span>
 <span><span class="fu">patchwork</span><span class="fu">::</span><span class="fu"><a href="https://patchwork.data-imaginist.com/reference/wrap_plots.html" class="external-link">wrap_plots</a></span><span class="op">(</span><span class="va">p1</span>, <span class="va">p2</span>, <span class="va">p3</span>, nrow <span class="op">=</span> <span class="fl">3</span><span class="op">)</span> <span class="op">+</span> </span>
 <span>    <span class="fu">patchwork</span><span class="fu">::</span><span class="fu"><a href="https://patchwork.data-imaginist.com/reference/plot_annotation.html" class="external-link">plot_annotation</a></span><span class="op">(</span>tag_levels <span class="op">=</span> <span class="st">"A"</span><span class="op">)</span></span></code></pre></div>
-<p><img src="doubletrouble_vignette_files/figure-html/unnamed-chunk-5-1.png" width="700"></p>
+<p><img src="doubletrouble_vignette_files/figure-html/unnamed-chunk-6-1.png" width="700"></p>
 <p>If you want to visually the frequency of duplicated
 <strong>genes</strong> (not gene pairs), you’d first need to classify
 genes into unique modes of duplication with
 <code><a href="../reference/classify_genes.html">classify_genes()</a></code>, and then repeat the code above. For
 example:</p>
-<div class="sourceCode" id="cb23"><pre class="downlit sourceCode r">
+<div class="sourceCode" id="cb24"><pre class="downlit sourceCode r">
 <code class="sourceCode R"><span><span class="co"># Frequency of duplicated genes by mode</span></span>
 <span><span class="fu"><a href="../reference/classify_genes.html">classify_genes</a></span><span class="op">(</span><span class="va">fungi_kaks</span><span class="op">)</span> <span class="op">|&gt;</span>   <span class="co"># classify genes into unique duplication types</span></span>
 <span>    <span class="fu"><a href="../reference/duplicates2counts.html">duplicates2counts</a></span><span class="op">(</span><span class="op">)</span> <span class="op">|&gt;</span>      <span class="co"># get a data frame of counts (long format)</span></span>
 <span>    <span class="fu"><a href="../reference/plot_duplicate_freqs.html">plot_duplicate_freqs</a></span><span class="op">(</span><span class="op">)</span>      <span class="co"># plot frequencies</span></span></code></pre></div>
-<p><img src="doubletrouble_vignette_files/figure-html/unnamed-chunk-6-1.png" width="768"></p>
+<p><img src="doubletrouble_vignette_files/figure-html/unnamed-chunk-7-1.png" width="768"></p>
 </div>
 <div class="section level3">
 <h3 id="visualizing-k_s-distributions">Visualizing
@@ -1189,7 +1183,7 @@ <h3 id="visualizing-k_s-distributions">Visualizing
 <math display="inline" xmlns="http://www.w3.org/1998/Math/MathML"><semantics><msub><mi>K</mi><mi>s</mi></msub><annotation encoding="application/x-tex">K_s</annotation></semantics></math>
 distribution for the whole paranome, you will use the function
 <code><a href="../reference/plot_ks_distro.html">plot_ks_distro()</a></code>.</p>
-<div class="sourceCode" id="cb24"><pre class="downlit sourceCode r">
+<div class="sourceCode" id="cb25"><pre class="downlit sourceCode r">
 <code class="sourceCode R"><span><span class="va">ks_df</span> <span class="op">&lt;-</span> <span class="va">fungi_kaks</span><span class="op">$</span><span class="va">saccharomyces_cerevisiae</span></span>
 <span></span>
 <span><span class="co"># A) Histogram, whole paranome</span></span>
@@ -1204,7 +1198,7 @@ <h3 id="visualizing-k_s-distributions">Visualizing
 <span><span class="co"># Combine plots side by side</span></span>
 <span><span class="fu">patchwork</span><span class="fu">::</span><span class="fu"><a href="https://patchwork.data-imaginist.com/reference/wrap_plots.html" class="external-link">wrap_plots</a></span><span class="op">(</span><span class="va">p1</span>, <span class="va">p2</span>, <span class="va">p3</span>, nrow <span class="op">=</span> <span class="fl">1</span><span class="op">)</span> <span class="op">+</span></span>
 <span>    <span class="fu">patchwork</span><span class="fu">::</span><span class="fu"><a href="https://patchwork.data-imaginist.com/reference/plot_annotation.html" class="external-link">plot_annotation</a></span><span class="op">(</span>tag_levels <span class="op">=</span> <span class="st">"A"</span><span class="op">)</span></span></code></pre></div>
-<p><img src="doubletrouble_vignette_files/figure-html/unnamed-chunk-7-1.png" width="864"></p>
+<p><img src="doubletrouble_vignette_files/figure-html/unnamed-chunk-8-1.png" width="864"></p>
 <p>However, visualizing the distribution for the whole paranome can mask
 patterns that only happen for duplicates originating from particular
 duplication types. For instance, when looking for evidence of WGD
@@ -1214,7 +1208,7 @@ <h3 id="visualizing-k_s-distributions">Visualizing
 cluster together, suggesting the presence of WGD history. To visualize
 the distribution by duplication type, use <code>bytype = TRUE</code> in
 <code><a href="../reference/plot_ks_distro.html">plot_ks_distro()</a></code>.</p>
-<div class="sourceCode" id="cb25"><pre class="downlit sourceCode r">
+<div class="sourceCode" id="cb26"><pre class="downlit sourceCode r">
 <code class="sourceCode R"><span><span class="co"># A) Duplicates by type, histogram</span></span>
 <span><span class="va">p1</span> <span class="op">&lt;-</span> <span class="fu"><a href="../reference/plot_ks_distro.html">plot_ks_distro</a></span><span class="op">(</span><span class="va">ks_df</span>, bytype <span class="op">=</span> <span class="cn">TRUE</span>, plot_type <span class="op">=</span> <span class="st">"histogram"</span><span class="op">)</span></span>
 <span></span>
@@ -1224,7 +1218,7 @@ <h3 id="visualizing-k_s-distributions">Visualizing
 <span><span class="co"># Combine plots side by side</span></span>
 <span><span class="fu">patchwork</span><span class="fu">::</span><span class="fu"><a href="https://patchwork.data-imaginist.com/reference/wrap_plots.html" class="external-link">wrap_plots</a></span><span class="op">(</span><span class="va">p1</span>, <span class="va">p2</span><span class="op">)</span> <span class="op">+</span></span>
 <span>    <span class="fu">patchwork</span><span class="fu">::</span><span class="fu"><a href="https://patchwork.data-imaginist.com/reference/plot_annotation.html" class="external-link">plot_annotation</a></span><span class="op">(</span>tag_levels <span class="op">=</span> <span class="st">"A"</span><span class="op">)</span></span></code></pre></div>
-<p><img src="doubletrouble_vignette_files/figure-html/unnamed-chunk-8-1.png" width="768"></p>
+<p><img src="doubletrouble_vignette_files/figure-html/unnamed-chunk-9-1.png" width="768"></p>
 </div>
 <div class="section level3">
 <h3 id="visualizing-substitution-rates-by-species">Visualizing substitution rates by species<a class="anchor" aria-label="anchor" href="#visualizing-substitution-rates-by-species"></a>
@@ -1238,7 +1232,7 @@ <h3 id="visualizing-substitution-rates-by-species">Visualizing substitution rate
 by species. You can choose which rate you want to visualize, and whether
 or not to group gene pairs by duplication mode, as demonstrated
 below.</p>
-<div class="sourceCode" id="cb26"><pre class="downlit sourceCode r">
+<div class="sourceCode" id="cb27"><pre class="downlit sourceCode r">
 <code class="sourceCode R"><span><span class="co"># A) Ks for each species</span></span>
 <span><span class="va">p1</span> <span class="op">&lt;-</span> <span class="fu"><a href="../reference/plot_rates_by_species.html">plot_rates_by_species</a></span><span class="op">(</span><span class="va">fungi_kaks</span><span class="op">)</span></span>
 <span></span>
@@ -1248,65 +1242,65 @@ <h3 id="visualizing-substitution-rates-by-species">Visualizing substitution rate
 <span><span class="co"># Combine plots - one per row</span></span>
 <span><span class="fu">patchwork</span><span class="fu">::</span><span class="fu"><a href="https://patchwork.data-imaginist.com/reference/wrap_plots.html" class="external-link">wrap_plots</a></span><span class="op">(</span><span class="va">p1</span>, <span class="va">p2</span>, nrow <span class="op">=</span> <span class="fl">2</span><span class="op">)</span> <span class="op">+</span></span>
 <span>    <span class="fu">patchwork</span><span class="fu">::</span><span class="fu"><a href="https://patchwork.data-imaginist.com/reference/plot_annotation.html" class="external-link">plot_annotation</a></span><span class="op">(</span>tag_levels <span class="op">=</span> <span class="st">"A"</span><span class="op">)</span></span></code></pre></div>
-<p><img src="doubletrouble_vignette_files/figure-html/unnamed-chunk-9-1.png" width="576"></p>
+<p><img src="doubletrouble_vignette_files/figure-html/unnamed-chunk-10-1.png" width="576"></p>
 </div>
 </div>
 <div class="section level2">
 <h2 class="unnumbered" id="session-information">Session information<a class="anchor" aria-label="anchor" href="#session-information"></a>
 </h2>
 <p>This document was created under the following conditions:</p>
-<div class="sourceCode" id="cb27"><pre class="downlit sourceCode r">
+<div class="sourceCode" id="cb28"><pre class="downlit sourceCode r">
 <code class="sourceCode R"><span><span class="fu">sessioninfo</span><span class="fu">::</span><span class="fu"><a href="https://r-lib.github.io/sessioninfo/reference/session_info.html" class="external-link">session_info</a></span><span class="op">(</span><span class="op">)</span></span>
 <span><span class="co">#&gt; <span style="color: #00BBBB; font-weight: bold;">─ Session info ───────────────────────────────────────────────────────────────</span></span></span>
 <span><span class="co">#&gt;  <span style="color: #555555; font-style: italic;">setting </span> <span style="color: #555555; font-style: italic;">value</span></span></span>
 <span><span class="co">#&gt;  version  R version 4.4.1 (2024-06-14)</span></span>
-<span><span class="co">#&gt;  os       Ubuntu 22.04.4 LTS</span></span>
+<span><span class="co">#&gt;  os       Ubuntu 22.04.5 LTS</span></span>
 <span><span class="co">#&gt;  system   x86_64, linux-gnu</span></span>
 <span><span class="co">#&gt;  ui       X11</span></span>
 <span><span class="co">#&gt;  language en</span></span>
 <span><span class="co">#&gt;  collate  en_US.UTF-8</span></span>
 <span><span class="co">#&gt;  ctype    en_US.UTF-8</span></span>
 <span><span class="co">#&gt;  tz       UTC</span></span>
-<span><span class="co">#&gt;  date     2024-07-25</span></span>
-<span><span class="co">#&gt;  pandoc   3.2 @ /usr/bin/ (via rmarkdown)</span></span>
+<span><span class="co">#&gt;  date     2024-10-02</span></span>
+<span><span class="co">#&gt;  pandoc   3.4 @ /usr/bin/ (via rmarkdown)</span></span>
 <span><span class="co">#&gt; </span></span>
 <span><span class="co">#&gt; <span style="color: #00BBBB; font-weight: bold;">─ Packages ───────────────────────────────────────────────────────────────────</span></span></span>
 <span><span class="co">#&gt;  <span style="color: #555555; font-style: italic;">package             </span> <span style="color: #555555; font-style: italic;">*</span> <span style="color: #555555; font-style: italic;">version  </span> <span style="color: #555555; font-style: italic;">date (UTC)</span> <span style="color: #555555; font-style: italic;">lib</span> <span style="color: #555555; font-style: italic;">source</span></span></span>
-<span><span class="co">#&gt;  abind                  1.4-5     <span style="color: #555555;">2016-07-21</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  abind                  1.4-8     <span style="color: #555555;">2024-09-12</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  ade4                   1.7-22    <span style="color: #555555;">2023-02-06</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  AnnotationDbi        * 1.67.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  ape                    5.8       <span style="color: #555555;">2024-04-11</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  Biobase              * 2.65.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  Biobase              * 2.65.1    <span style="color: #555555;">2024-08-28</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  BiocFileCache          2.13.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  BiocGenerics         * 0.51.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  BiocIO                 1.15.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  BiocManager            1.30.23   <span style="color: #555555;">2024-05-04</span> <span style="color: #555555;">[2]</span> <span style="color: #555555;">CRAN (R 4.4.1)</span></span></span>
+<span><span class="co">#&gt;  BiocGenerics         * 0.51.2    <span style="color: #555555;">2024-09-27</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
+<span><span class="co">#&gt;  BiocIO                 1.15.2    <span style="color: #555555;">2024-08-23</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
+<span><span class="co">#&gt;  BiocManager            1.30.25   <span style="color: #555555;">2024-08-28</span> <span style="color: #555555;">[2]</span> <span style="color: #555555;">CRAN (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  BiocParallel           1.39.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  BiocStyle            * 2.33.1    <span style="color: #555555;">2024-06-12</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  biomaRt                2.61.2    <span style="color: #555555;">2024-06-24</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
-<span><span class="co">#&gt;  Biostrings             2.73.1    <span style="color: #555555;">2024-06-02</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  bit                    4.0.5     <span style="color: #555555;">2022-11-15</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  bit64                  4.0.5     <span style="color: #555555;">2020-08-30</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  bitops                 1.0-7     <span style="color: #555555;">2021-04-24</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  biomaRt                2.61.3    <span style="color: #555555;">2024-08-06</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
+<span><span class="co">#&gt;  Biostrings             2.73.2    <span style="color: #555555;">2024-09-26</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
+<span><span class="co">#&gt;  bit                    4.5.0     <span style="color: #555555;">2024-09-20</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  bit64                  4.5.2     <span style="color: #555555;">2024-09-22</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  bitops                 1.0-8     <span style="color: #555555;">2024-07-29</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  blob                   1.2.4     <span style="color: #555555;">2023-03-17</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  bookdown               0.40      <span style="color: #555555;">2024-07-02</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  bslib                  0.7.0     <span style="color: #555555;">2024-03-29</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  bslib                  0.8.0     <span style="color: #555555;">2024-07-29</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  cachem                 1.1.0     <span style="color: #555555;">2024-05-16</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  cli                    3.6.3     <span style="color: #555555;">2024-06-21</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  coda                   0.19-4.1  <span style="color: #555555;">2024-01-31</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  codetools              0.2-20    <span style="color: #555555;">2024-03-31</span> <span style="color: #555555;">[3]</span> <span style="color: #555555;">CRAN (R 4.4.1)</span></span></span>
-<span><span class="co">#&gt;  colorspace             2.1-0     <span style="color: #555555;">2023-01-23</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  colorspace             2.1-1     <span style="color: #555555;">2024-07-26</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  crayon                 1.5.3     <span style="color: #555555;">2024-06-20</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  curl                   5.2.1     <span style="color: #555555;">2024-03-01</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  curl                   5.2.3     <span style="color: #555555;">2024-09-20</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  DBI                    1.2.3     <span style="color: #555555;">2024-06-02</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  dbplyr                 2.5.0     <span style="color: #555555;">2024-03-19</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  DelayedArray           0.31.9    <span style="color: #555555;">2024-07-17</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
+<span><span class="co">#&gt;  DelayedArray           0.31.12   <span style="color: #555555;">2024-09-27</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  desc                   1.4.3     <span style="color: #555555;">2023-12-10</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  digest                 0.6.36    <span style="color: #555555;">2024-06-23</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  digest                 0.6.37    <span style="color: #555555;">2024-08-19</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  doParallel             1.0.17    <span style="color: #555555;">2022-02-07</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  doubletrouble        * 1.5.1     <span style="color: #555555;">2024-07-25</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor</span></span></span>
+<span><span class="co">#&gt;  doubletrouble        * 1.5.2     <span style="color: #555555;">2024-10-02</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor</span></span></span>
 <span><span class="co">#&gt;  dplyr                  1.1.4     <span style="color: #555555;">2023-11-17</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  evaluate               0.24.0    <span style="color: #555555;">2024-06-10</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  evaluate               1.0.0     <span style="color: #555555;">2024-09-17</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  fansi                  1.0.6     <span style="color: #555555;">2023-12-08</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  farver                 2.1.2     <span style="color: #555555;">2024-05-13</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  fastmap                1.2.0     <span style="color: #555555;">2024-05-15</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
@@ -1316,30 +1310,30 @@ <h2 class="unnumbered" id="session-information">Session information<a class="anc
 <span><span class="co">#&gt;  fs                     1.6.4     <span style="color: #555555;">2024-04-25</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  generics               0.1.3     <span style="color: #555555;">2022-07-05</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  GenomeInfoDb         * 1.41.1    <span style="color: #555555;">2024-05-24</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  GenomeInfoDbData       1.2.12    <span style="color: #555555;">2024-06-24</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor</span></span></span>
+<span><span class="co">#&gt;  GenomeInfoDbData       1.2.13    <span style="color: #555555;">2024-10-02</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor</span></span></span>
 <span><span class="co">#&gt;  GenomicAlignments      1.41.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  GenomicFeatures      * 1.57.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  GenomicFeatures      * 1.57.1    <span style="color: #555555;">2024-09-27</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  GenomicRanges        * 1.57.1    <span style="color: #555555;">2024-06-12</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  ggnetwork              0.5.13    <span style="color: #555555;">2024-02-14</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  ggplot2                3.5.1     <span style="color: #555555;">2024-04-23</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  glue                   1.7.0     <span style="color: #555555;">2024-01-09</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  glue                   1.8.0     <span style="color: #555555;">2024-09-30</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  gtable                 0.3.5     <span style="color: #555555;">2024-04-22</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  highr                  0.11      <span style="color: #555555;">2024-05-26</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  hms                    1.1.3     <span style="color: #555555;">2023-03-21</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  htmltools              0.5.8.1   <span style="color: #555555;">2024-04-04</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  htmlwidgets            1.6.4     <span style="color: #555555;">2023-12-06</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  httr                   1.4.7     <span style="color: #555555;">2023-08-15</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  httr2                  1.0.2     <span style="color: #555555;">2024-07-16</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  httr2                  1.0.5     <span style="color: #555555;">2024-09-26</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  igraph                 2.0.3     <span style="color: #555555;">2024-03-13</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  intergraph             2.0-4     <span style="color: #555555;">2024-02-01</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  IRanges              * 2.39.2    <span style="color: #555555;">2024-07-17</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  iterators              1.0.14    <span style="color: #555555;">2022-02-05</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  jquerylib              0.1.4     <span style="color: #555555;">2021-04-26</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  jsonlite               1.8.8     <span style="color: #555555;">2023-12-04</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  jsonlite               1.8.9     <span style="color: #555555;">2024-09-20</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  KEGGREST               1.45.1    <span style="color: #555555;">2024-06-17</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  KernSmooth             2.23-24   <span style="color: #555555;">2024-05-17</span> <span style="color: #555555;">[3]</span> <span style="color: #555555;">CRAN (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  knitr                  1.48      <span style="color: #555555;">2024-07-07</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  ks                     1.14.2    <span style="color: #555555;">2024-01-15</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  ks                     1.14.3    <span style="color: #555555;">2024-09-20</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  labeling               0.4.3     <span style="color: #555555;">2023-08-29</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  lattice                0.22-6    <span style="color: #555555;">2024-03-20</span> <span style="color: #555555;">[3]</span> <span style="color: #555555;">CRAN (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  lifecycle              1.0.4     <span style="color: #555555;">2023-11-07</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
@@ -1347,20 +1341,20 @@ <h2 class="unnumbered" id="session-information">Session information<a class="anc
 <span><span class="co">#&gt;  MASS                   7.3-61    <span style="color: #555555;">2024-06-13</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  Matrix                 1.7-0     <span style="color: #555555;">2024-04-26</span> <span style="color: #555555;">[3]</span> <span style="color: #555555;">CRAN (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  MatrixGenerics         1.17.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  matrixStats            1.3.0     <span style="color: #555555;">2024-04-11</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  matrixStats            1.4.1     <span style="color: #555555;">2024-09-08</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  mclust                 6.1.1     <span style="color: #555555;">2024-04-29</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  memoise                2.0.1     <span style="color: #555555;">2021-11-26</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  MSA2dist               1.9.0     <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  munsell                0.5.1     <span style="color: #555555;">2024-04-01</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  mvtnorm                1.2-5     <span style="color: #555555;">2024-05-21</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  mvtnorm                1.3-1     <span style="color: #555555;">2024-09-03</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  network                1.18.2    <span style="color: #555555;">2023-12-05</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  networkD3              0.4       <span style="color: #555555;">2017-03-18</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  nlme                   3.1-165   <span style="color: #555555;">2024-06-06</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  patchwork              1.2.0     <span style="color: #555555;">2024-01-08</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  nlme                   3.1-166   <span style="color: #555555;">2024-08-14</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  patchwork              1.3.0     <span style="color: #555555;">2024-09-16</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  pheatmap               1.0.12    <span style="color: #555555;">2019-01-04</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  pillar                 1.9.0     <span style="color: #555555;">2023-03-22</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  pkgconfig              2.0.3     <span style="color: #555555;">2019-09-22</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  pkgdown                2.1.0     <span style="color: #555555;">2024-07-06</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  pkgdown                2.1.1     <span style="color: #555555;">2024-09-17</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  png                    0.1-8     <span style="color: #555555;">2022-11-29</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  pracma                 2.4.4     <span style="color: #555555;">2023-11-10</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  prettyunits            1.2.0     <span style="color: #555555;">2023-09-24</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
@@ -1368,29 +1362,29 @@ <h2 class="unnumbered" id="session-information">Session information<a class="anc
 <span><span class="co">#&gt;  purrr                  1.0.2     <span style="color: #555555;">2023-08-10</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  pwalign                1.1.0     <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  R6                     2.5.1     <span style="color: #555555;">2021-08-19</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  ragg                   1.3.2     <span style="color: #555555;">2024-05-15</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  ragg                   1.3.3     <span style="color: #555555;">2024-09-11</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  rappdirs               0.3.3     <span style="color: #555555;">2021-01-31</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  RColorBrewer           1.1-3     <span style="color: #555555;">2022-04-03</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  Rcpp                   1.0.13    <span style="color: #555555;">2024-07-17</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  RCurl                  1.98-1.16 <span style="color: #555555;">2024-07-11</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  restfulr               0.0.15    <span style="color: #555555;">2022-06-16</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  rjson                  0.2.21    <span style="color: #555555;">2022-01-09</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  rjson                  0.2.23    <span style="color: #555555;">2024-09-16</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  rlang                  1.1.4     <span style="color: #555555;">2024-06-04</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  rmarkdown              2.27      <span style="color: #555555;">2024-05-17</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  Rsamtools              2.21.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  rmarkdown              2.28      <span style="color: #555555;">2024-08-17</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  Rsamtools              2.21.2    <span style="color: #555555;">2024-09-26</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  RSQLite                2.3.7     <span style="color: #555555;">2024-05-27</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  rtracklayer            1.65.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  S4Arrays               1.5.5     <span style="color: #555555;">2024-07-21</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
+<span><span class="co">#&gt;  S4Arrays               1.5.10    <span style="color: #555555;">2024-09-29</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  S4Vectors            * 0.43.2    <span style="color: #555555;">2024-07-17</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  sass                   0.4.9     <span style="color: #555555;">2024-03-15</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  scales                 1.3.0     <span style="color: #555555;">2023-11-28</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  seqinr                 4.2-36    <span style="color: #555555;">2023-12-08</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  sessioninfo            1.2.2     <span style="color: #555555;">2021-12-06</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  SparseArray            1.5.25    <span style="color: #555555;">2024-07-21</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
+<span><span class="co">#&gt;  SparseArray            1.5.41    <span style="color: #555555;">2024-09-27</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  statnet.common         4.9.0     <span style="color: #555555;">2023-05-24</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  stringi                1.8.4     <span style="color: #555555;">2024-05-06</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  stringr                1.5.1     <span style="color: #555555;">2023-11-14</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  SummarizedExperiment   1.35.1    <span style="color: #555555;">2024-06-28</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
+<span><span class="co">#&gt;  SummarizedExperiment   1.35.2    <span style="color: #555555;">2024-09-27</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.1)</span></span></span>
 <span><span class="co">#&gt;  syntenet             * 1.7.0     <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  systemfonts            1.1.0     <span style="color: #555555;">2024-05-15</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  textshaping            0.4.0     <span style="color: #555555;">2024-05-24</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
@@ -1401,12 +1395,12 @@ <h2 class="unnumbered" id="session-information">Session information<a class="anc
 <span><span class="co">#&gt;  UCSC.utils             1.1.0     <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  utf8                   1.2.4     <span style="color: #555555;">2023-10-22</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  vctrs                  0.6.5     <span style="color: #555555;">2023-12-01</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  withr                  3.0.0     <span style="color: #555555;">2024-01-16</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  xfun                   0.46      <span style="color: #555555;">2024-07-18</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  withr                  3.0.1     <span style="color: #555555;">2024-07-31</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  xfun                   0.47      <span style="color: #555555;">2024-08-17</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  XML                    3.99-0.17 <span style="color: #555555;">2024-06-25</span> <span style="color: #555555;">[1]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  xml2                   1.3.6     <span style="color: #555555;">2023-12-04</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  XVector                0.45.0    <span style="color: #555555;">2024-05-01</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
-<span><span class="co">#&gt;  yaml                   2.3.9     <span style="color: #555555;">2024-07-05</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
+<span><span class="co">#&gt;  yaml                   2.3.10    <span style="color: #555555;">2024-07-26</span> <span style="color: #555555;">[2]</span> <span style="color: #BB00BB; font-weight: bold;">RSPM (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt;  zlibbioc               1.51.1    <span style="color: #555555;">2024-06-05</span> <span style="color: #555555;">[1]</span> <span style="color: #555555;">Bioconductor 3.20 (R 4.4.0)</span></span></span>
 <span><span class="co">#&gt; </span></span>
 <span><span class="co">#&gt; <span style="color: #555555;"> [1] /__w/_temp/Library</span></span></span>
@@ -1472,7 +1466,7 @@ <h2 class="unnumbered" id="references">References<a class="anchor" aria-label="a
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer>
diff --git a/articles/doubletrouble_vignette_files/figure-html/find_ks_peaks-1.png b/articles/doubletrouble_vignette_files/figure-html/find_ks_peaks-1.png
index 14ecb31..5f18a13 100644
Binary files a/articles/doubletrouble_vignette_files/figure-html/find_ks_peaks-1.png and b/articles/doubletrouble_vignette_files/figure-html/find_ks_peaks-1.png differ
diff --git a/articles/doubletrouble_vignette_files/figure-html/find_peaks_explicit-1.png b/articles/doubletrouble_vignette_files/figure-html/find_peaks_explicit-1.png
index 0b67df6..ba97bdc 100644
Binary files a/articles/doubletrouble_vignette_files/figure-html/find_peaks_explicit-1.png and b/articles/doubletrouble_vignette_files/figure-html/find_peaks_explicit-1.png differ
diff --git a/articles/doubletrouble_vignette_files/figure-html/ks_eda-1.png b/articles/doubletrouble_vignette_files/figure-html/ks_eda-1.png
index ccee6ff..143a111 100644
Binary files a/articles/doubletrouble_vignette_files/figure-html/ks_eda-1.png and b/articles/doubletrouble_vignette_files/figure-html/ks_eda-1.png differ
diff --git a/articles/doubletrouble_vignette_files/figure-html/sizer-1.png b/articles/doubletrouble_vignette_files/figure-html/sizer-1.png
index 80c8e19..0f89683 100644
Binary files a/articles/doubletrouble_vignette_files/figure-html/sizer-1.png and b/articles/doubletrouble_vignette_files/figure-html/sizer-1.png differ
diff --git a/articles/doubletrouble_vignette_files/figure-html/split_by_peak-1.png b/articles/doubletrouble_vignette_files/figure-html/split_by_peak-1.png
index 9ec0cf7..7d8d791 100644
Binary files a/articles/doubletrouble_vignette_files/figure-html/split_by_peak-1.png and b/articles/doubletrouble_vignette_files/figure-html/split_by_peak-1.png differ
diff --git a/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-10-1.png b/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-10-1.png
new file mode 100644
index 0000000..089d945
Binary files /dev/null and b/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-10-1.png differ
diff --git a/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-5-1.png b/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-5-1.png
deleted file mode 100644
index 367b253..0000000
Binary files a/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-5-1.png and /dev/null differ
diff --git a/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-6-1.png b/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-6-1.png
index 72461c6..367b253 100644
Binary files a/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-6-1.png and b/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-6-1.png differ
diff --git a/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-7-1.png b/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-7-1.png
index a6a713f..72461c6 100644
Binary files a/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-7-1.png and b/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-7-1.png differ
diff --git a/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-8-1.png b/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-8-1.png
index 0da928f..a6a713f 100644
Binary files a/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-8-1.png and b/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-8-1.png differ
diff --git a/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-9-1.png b/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-9-1.png
index 089d945..0da928f 100644
Binary files a/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-9-1.png and b/articles/doubletrouble_vignette_files/figure-html/unnamed-chunk-9-1.png differ
diff --git a/articles/index.html b/articles/index.html
index 0c077b1..4ec84ce 100644
--- a/articles/index.html
+++ b/articles/index.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -49,7 +49,7 @@ <h3>All vignettes</h3>
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/authors.html b/authors.html
index b344187..7691a70 100644
--- a/authors.html
+++ b/authors.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -53,13 +53,13 @@ <h2 id="citation">Citation</h2>
 
       <p>Almeida-Silva F, Van de Peer Y (2024).
 <em>doubletrouble: Identification and classification of duplicated genes</em>.
-R package version 1.5.1, <a href="https://github.com/almeidasilvaf/doubletrouble" class="external-link">https://github.com/almeidasilvaf/doubletrouble</a>.
+R package version 1.5.2, <a href="https://github.com/almeidasilvaf/doubletrouble" class="external-link">https://github.com/almeidasilvaf/doubletrouble</a>.
 </p>
       <pre>@Manual{,
   title = {doubletrouble: Identification and classification of duplicated genes},
   author = {Fabrício Almeida-Silva and Yves {Van de Peer}},
   year = {2024},
-  note = {R package version 1.5.1},
+  note = {R package version 1.5.2},
   url = {https://github.com/almeidasilvaf/doubletrouble},
 }</pre>
     </div>
@@ -73,7 +73,7 @@ <h2 id="citation">Citation</h2>
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/index.html b/index.html
index 692e49c..1a6a216 100644
--- a/index.html
+++ b/index.html
@@ -25,7 +25,7 @@
 
     <a class="navbar-brand me-2" href="index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -64,24 +64,24 @@
 
 <p>The major goal of <strong>doubletrouble</strong> is to identify duplicated genes from whole-genome protein sequences and classify them based on their modes of duplication. Duplicates can be classified using four different classification schemes, which increase the complexity and level of details in a stepwise manner. The classification schemes and the duplication modes they can classify are:</p>
 <table class="table">
-<thead><tr class="header">
+<thead><tr>
 <th align="left">Scheme</th>
 <th align="left">Duplication modes</th>
 </tr></thead>
 <tbody>
-<tr class="odd">
+<tr>
 <td align="left">binary</td>
 <td align="left">SD, SSD</td>
 </tr>
-<tr class="even">
+<tr>
 <td align="left">standard</td>
 <td align="left">SD, TD, PD, DD</td>
 </tr>
-<tr class="odd">
+<tr>
 <td align="left">extended</td>
 <td align="left">SD, TD, PD, TRD, DD</td>
 </tr>
-<tr class="even">
+<tr>
 <td align="left">full</td>
 <td align="left">SD, TD, PD, rTRD, dTRD, DD</td>
 </tr>
@@ -205,7 +205,7 @@ <h2 data-toc-skip>Dev status</h2>
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer>
diff --git a/news/index.html b/news/index.html
index 543500e..f355a1f 100644
--- a/news/index.html
+++ b/news/index.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -59,7 +59,7 @@ <h2 class="pkg-version" data-toc-text="0.99.3" id="doubletrouble-0993">doubletro
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/pkgdown.js b/pkgdown.js
index 9757bf9..1a99c65 100644
--- a/pkgdown.js
+++ b/pkgdown.js
@@ -152,3 +152,11 @@ async function searchFuse(query, callback) {
   });
   });
 })(window.jQuery || window.$)
+
+document.addEventListener('keydown', function(event) {
+  // '/' jumps to the search box, unless the page has none or the user is typing in a field.
+  var search = document.getElementById('search-input'), el = event.target;
+  // Editable targets (including the search box itself) must still receive a literal '/'.
+  var typing = el && (el.isContentEditable || /^(INPUT|TEXTAREA|SELECT)$/.test(el.tagName));
+  if (event.key !== '/' || !search || typing) return;
+  event.preventDefault(); search.focus();  // swallow the '/' so it is not typed into the input
+});
diff --git a/pkgdown.yml b/pkgdown.yml
index 6dbd635..142412d 100644
--- a/pkgdown.yml
+++ b/pkgdown.yml
@@ -1,6 +1,6 @@
-pandoc: '3.2'
-pkgdown: 2.1.0
+pandoc: '3.4'
+pkgdown: 2.1.1
 pkgdown_sha: ~
 articles:
   doubletrouble_vignette: doubletrouble_vignette.html
-last_built: 2024-07-25T09:05Z
+last_built: 2024-10-02T09:48Z
diff --git a/reference/Rplot001.png b/reference/Rplot001.png
deleted file mode 100644
index 17a3580..0000000
Binary files a/reference/Rplot001.png and /dev/null differ
diff --git a/reference/cds_scerevisiae.html b/reference/cds_scerevisiae.html
index ad218f7..380949b 100644
--- a/reference/cds_scerevisiae.html
+++ b/reference/cds_scerevisiae.html
@@ -9,7 +9,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -67,7 +67,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/classify_gene_pairs.html b/reference/classify_gene_pairs.html
index 73e3a70..8b6020a 100644
--- a/reference/classify_gene_pairs.html
+++ b/reference/classify_gene_pairs.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -175,8 +175,8 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 <span class="r-msg co"><span class="r-pr">#&gt;</span>     as.data.frame, basename, cbind, colnames, dirname, do.call,</span>
 <span class="r-msg co"><span class="r-pr">#&gt;</span>     duplicated, eval, evalq, get, grep, grepl, intersect, is.unsorted,</span>
 <span class="r-msg co"><span class="r-pr">#&gt;</span>     lapply, mapply, match, mget, order, paste, pmax, pmax.int, pmin,</span>
-<span class="r-msg co"><span class="r-pr">#&gt;</span>     pmin.int, rank, rbind, rownames, sapply, setdiff, table, tapply,</span>
-<span class="r-msg co"><span class="r-pr">#&gt;</span>     union, unique, unsplit, which.max, which.min</span>
+<span class="r-msg co"><span class="r-pr">#&gt;</span>     pmin.int, rank, rbind, rownames, sapply, saveRDS, setdiff, table,</span>
+<span class="r-msg co"><span class="r-pr">#&gt;</span>     tapply, union, unique, unsplit, which.max, which.min</span>
 <span class="r-msg co"><span class="r-pr">#&gt;</span> Loading required package: S4Vectors</span>
 <span class="r-msg co"><span class="r-pr">#&gt;</span> Loading required package: stats4</span>
 <span class="r-msg co"><span class="r-pr">#&gt;</span> </span>
@@ -239,7 +239,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/classify_genes.html b/reference/classify_genes.html
index e174262..c1fb1c6 100644
--- a/reference/classify_genes.html
+++ b/reference/classify_genes.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -90,7 +90,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/diamond_inter.html b/reference/diamond_inter.html
index eb05f07..3ad9090 100644
--- a/reference/diamond_inter.html
+++ b/reference/diamond_inter.html
@@ -9,7 +9,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -68,7 +68,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/diamond_intra.html b/reference/diamond_intra.html
index 34e9b7c..bf5474c 100644
--- a/reference/diamond_intra.html
+++ b/reference/diamond_intra.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -65,7 +65,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/duplicates2counts.html b/reference/duplicates2counts.html
index 8bec5a0..266d889 100644
--- a/reference/duplicates2counts.html
+++ b/reference/duplicates2counts.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -100,7 +100,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/find_ks_peaks.html b/reference/find_ks_peaks.html
index 61ea4b4..b7882cc 100644
--- a/reference/find_ks_peaks.html
+++ b/reference/find_ks_peaks.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -129,7 +129,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/fungi_kaks.html b/reference/fungi_kaks.html
index 86a2790..7605bba 100644
--- a/reference/fungi_kaks.html
+++ b/reference/fungi_kaks.html
@@ -9,7 +9,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -88,7 +88,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/get_anchors_list.html b/reference/get_anchors_list.html
index c6a051b..b395a39 100644
--- a/reference/get_anchors_list.html
+++ b/reference/get_anchors_list.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -121,7 +121,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/get_intron_counts.html b/reference/get_intron_counts.html
index 98a65ca..c01380e 100644
--- a/reference/get_intron_counts.html
+++ b/reference/get_intron_counts.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -96,7 +96,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/get_segmental.html b/reference/get_segmental.html
index d26a572..e79bfd3 100644
--- a/reference/get_segmental.html
+++ b/reference/get_segmental.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -104,7 +104,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/get_tandem_proximal.html b/reference/get_tandem_proximal.html
index 8ad2f5c..3b58baf 100644
--- a/reference/get_tandem_proximal.html
+++ b/reference/get_tandem_proximal.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -115,7 +115,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/get_transposed.html b/reference/get_transposed.html
index f85fb49..c2ef887 100644
--- a/reference/get_transposed.html
+++ b/reference/get_transposed.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -152,7 +152,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/get_transposed_classes.html b/reference/get_transposed_classes.html
index 680e8e8..403a890 100644
--- a/reference/get_transposed_classes.html
+++ b/reference/get_transposed_classes.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -124,7 +124,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/gmax_ks.html b/reference/gmax_ks.html
index 1d9372c..765d2df 100644
--- a/reference/gmax_ks.html
+++ b/reference/gmax_ks.html
@@ -9,7 +9,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -59,6 +59,9 @@ <h2 id="format">Format<a class="anchor" aria-label="anchor" href="#format"></a><
 <dt>Ks</dt>
 <dd><p>Numeric, Ks values.</p></dd>
 
+<dt>type</dt>
+<dd><p>Factor, duplication mode.</p></dd>
+
 
 </dl></div>
 
@@ -76,7 +79,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/index.html b/reference/index.html
index b0e56ad..b1c29c3 100644
--- a/reference/index.html
+++ b/reference/index.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -192,7 +192,7 @@ <h2 id="all-functions">All functions<a class="anchor" aria-label="anchor" href="
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/pairs2kaks.html b/reference/pairs2kaks.html
index 228db17..26361e5 100644
--- a/reference/pairs2kaks.html
+++ b/reference/pairs2kaks.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -42,7 +42,7 @@
 
     <div class="section level2">
     <h2 id="ref-usage">Usage<a class="anchor" aria-label="anchor" href="#ref-usage"></a></h2>
-    <div class="sourceCode"><pre class="sourceCode r"><code><span><span class="fu">pairs2kaks</span><span class="op">(</span><span class="va">gene_pairs_list</span>, <span class="va">cds</span>, model <span class="op">=</span> <span class="st">"MYN"</span>, threads <span class="op">=</span> <span class="fl">1</span><span class="op">)</span></span></code></pre></div>
+    <div class="sourceCode"><pre class="sourceCode r"><code><span><span class="fu">pairs2kaks</span><span class="op">(</span><span class="va">gene_pairs_list</span>, <span class="va">cds</span>, model <span class="op">=</span> <span class="st">"MYN"</span>, threads <span class="op">=</span> <span class="fl">1</span>, verbose <span class="op">=</span> <span class="cn">FALSE</span><span class="op">)</span></span></code></pre></div>
     </div>
 
     <div class="section level2">
@@ -69,6 +69,11 @@ <h2 id="arguments">Arguments<a class="anchor" aria-label="anchor" href="#argumen
 <dt id="arg-threads">threads<a class="anchor" aria-label="anchor" href="#arg-threads"></a></dt>
 <dd><p>Numeric indicating the number of threads to use. Default: 1.</p></dd>
 
+
+<dt id="arg-verbose">verbose<a class="anchor" aria-label="anchor" href="#arg-verbose"></a></dt>
+<dd><p>Logical indicating whether progress messages should be
+printed on screen. Default: FALSE.</p></dd>
+
 </dl></div>
     <div class="section level2">
     <h2 id="value">Value<a class="anchor" aria-label="anchor" href="#value"></a></h2>
@@ -111,7 +116,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/plot_duplicate_freqs-1.png b/reference/plot_duplicate_freqs-1.png
index ce3f0c1..bda3ee4 100644
Binary files a/reference/plot_duplicate_freqs-1.png and b/reference/plot_duplicate_freqs-1.png differ
diff --git a/reference/plot_duplicate_freqs.html b/reference/plot_duplicate_freqs.html
index 2286f47..f4e7384 100644
--- a/reference/plot_duplicate_freqs.html
+++ b/reference/plot_duplicate_freqs.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -97,7 +97,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/plot_ks_distro-1.png b/reference/plot_ks_distro-1.png
index 584c885..9052733 100644
Binary files a/reference/plot_ks_distro-1.png and b/reference/plot_ks_distro-1.png differ
diff --git a/reference/plot_ks_distro.html b/reference/plot_ks_distro.html
index 2b565f0..ef2f393 100644
--- a/reference/plot_ks_distro.html
+++ b/reference/plot_ks_distro.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -119,7 +119,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/plot_ks_peaks-1.png b/reference/plot_ks_peaks-1.png
index 967cb1e..b7f2497 100644
Binary files a/reference/plot_ks_peaks-1.png and b/reference/plot_ks_peaks-1.png differ
diff --git a/reference/plot_ks_peaks.html b/reference/plot_ks_peaks.html
index b55cd90..8ab1fb2 100644
--- a/reference/plot_ks_peaks.html
+++ b/reference/plot_ks_peaks.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -88,7 +88,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/plot_rates_by_species-1.png b/reference/plot_rates_by_species-1.png
index dd6adc6..9416095 100644
Binary files a/reference/plot_rates_by_species-1.png and b/reference/plot_rates_by_species-1.png differ
diff --git a/reference/plot_rates_by_species.html b/reference/plot_rates_by_species.html
index 34604d0..039c5cd 100644
--- a/reference/plot_rates_by_species.html
+++ b/reference/plot_rates_by_species.html
@@ -7,7 +7,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -115,7 +115,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/split_pairs_by_peak.html b/reference/split_pairs_by_peak.html
index 3b61336..ae28cbf 100644
--- a/reference/split_pairs_by_peak.html
+++ b/reference/split_pairs_by_peak.html
@@ -13,7 +13,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -119,7 +119,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/yeast_annot.html b/reference/yeast_annot.html
index 24b028c..5039f15 100644
--- a/reference/yeast_annot.html
+++ b/reference/yeast_annot.html
@@ -9,7 +9,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -68,7 +68,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/reference/yeast_seq.html b/reference/yeast_seq.html
index 5a19ad0..c0cecc2 100644
--- a/reference/yeast_seq.html
+++ b/reference/yeast_seq.html
@@ -9,7 +9,7 @@
 
     <a class="navbar-brand me-2" href="../index.html">doubletrouble</a>
 
-    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.1</small>
+    <small class="nav-text text-muted me-auto" data-bs-toggle="tooltip" data-bs-placement="bottom" title="">1.5.2</small>
 
 
     <button class="navbar-toggler" type="button" data-bs-toggle="collapse" data-bs-target="#navbar" aria-controls="navbar" aria-expanded="false" aria-label="Toggle navigation">
@@ -68,7 +68,7 @@ <h2 id="ref-examples">Examples<a class="anchor" aria-label="anchor" href="#ref-e
 </div>
 
 <div class="pkgdown-footer-right">
-  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.0.</p>
+  <p>Site built with <a href="https://pkgdown.r-lib.org/" class="external-link">pkgdown</a> 2.1.1.</p>
 </div>
 
     </footer></div>
diff --git a/search.json b/search.json
index e2ebdd2..f52db3a 100644
--- a/search.json
+++ b/search.json
@@ -1 +1 @@
-[{"path":"/CONTRIBUTING.html","id":null,"dir":"","previous_headings":"","what":"Contributing to doubletrouble","title":"Contributing to doubletrouble","text":"outlines propose change doubletrouble. detailed info contributing , tidyverse packages, please see development contributing guide.","code":""},{"path":"/CONTRIBUTING.html","id":"fixing-typos","dir":"","previous_headings":"","what":"Fixing typos","title":"Contributing to doubletrouble","text":"can fix typos, spelling mistakes, grammatical errors documentation directly using GitHub web interface, long changes made source file. generally means ’ll need edit roxygen2 comments .R, .Rd file. can find .R file generates .Rd reading comment first line.","code":""},{"path":"/CONTRIBUTING.html","id":"bigger-changes","dir":"","previous_headings":"","what":"Bigger changes","title":"Contributing to doubletrouble","text":"want make bigger change, ’s good idea first file issue make sure someone team agrees ’s needed. ’ve found bug, please file issue illustrates bug minimal reprex (also help write unit test, needed).","code":""},{"path":"/CONTRIBUTING.html","id":"pull-request-process","dir":"","previous_headings":"Bigger changes","what":"Pull request process","title":"Contributing to doubletrouble","text":"Fork package clone onto computer. haven’t done , recommend using usethis::create_from_github(\"almeidasilvaf/doubletrouble\", fork = TRUE). Install development dependencies devtools::install_dev_deps(), make sure package passes R CMD check running devtools::check(). R CMD check doesn’t pass cleanly, ’s good idea ask help continuing. Create Git branch pull request (PR). recommend using usethis::pr_init(\"brief-description--change\"). Make changes, commit git, create PR running usethis::pr_push(), following prompts browser. title PR briefly describe change. body PR contain Fixes #issue-number. user-facing changes, add bullet top NEWS.md (.e. just first header). 
Follow style described https://style.tidyverse.org/news.html.","code":""},{"path":"/CONTRIBUTING.html","id":"code-style","dir":"","previous_headings":"Bigger changes","what":"Code style","title":"Contributing to doubletrouble","text":"New code follow tidyverse style guide. can use styler package apply styles, please don’t restyle code nothing PR. use roxygen2, Markdown syntax, documentation. use testthat unit tests. Contributions test cases included easier accept.","code":""},{"path":"/CONTRIBUTING.html","id":"code-of-conduct","dir":"","previous_headings":"","what":"Code of Conduct","title":"Contributing to doubletrouble","text":"Please note doubletrouble project released Contributor Code Conduct. contributing project agree abide terms.","code":""},{"path":"/SUPPORT.html","id":null,"dir":"","previous_headings":"","what":"Getting help with doubletrouble","title":"Getting help with doubletrouble","text":"Thanks using doubletrouble! filing issue, places explore pieces put together make process smooth possible.","code":""},{"path":"/SUPPORT.html","id":"make-a-reprex","dir":"","previous_headings":"","what":"Make a reprex","title":"Getting help with doubletrouble","text":"Start making minimal reproducible example using reprex package. haven’t heard used reprex , ’re treat! Seriously, reprex make R-question-asking endeavors easier (pretty insane ROI five ten minutes ’ll take learn ’s ). additional reprex pointers, check Get help! section tidyverse site.","code":""},{"path":"/SUPPORT.html","id":"where-to-ask","dir":"","previous_headings":"","what":"Where to ask?","title":"Getting help with doubletrouble","text":"Armed reprex, next step figure ask. See also Bioconductor help website. ’s question: start community.rstudio.com, /StackOverflow. Bioconductor-related question, please ask Bioconductor Support Website using appropriate package tag (website send automatic email package authors). people answer questions. ’s bug: ’re right place, file issue. 
’re sure: let community help figure ! problem bug feature request, can easily return report . opening new issue, sure search issues pull requests make sure bug hasn’t reported /already fixed development version. default, search pre-populated :issue :open. can edit qualifiers (e.g. :pr, :closed) needed. example, ’d simply remove :open search issues repo, open closed.","code":""},{"path":"/SUPPORT.html","id":"what-happens-next","dir":"","previous_headings":"","what":"What happens next?","title":"Getting help with doubletrouble","text":"efficient possible, development tidyverse packages tends bursty, shouldn’t worry don’t get immediate response. Typically don’t look repo sufficient quantity issues accumulates, ’s burst intense activity focus efforts. makes development efficient avoids expensive context switching problems, cost taking longer get back . process makes good reprex particularly important might multiple months initial report start working . can’t reproduce bug, can’t fix !","code":""},{"path":"/articles/doubletrouble_vignette.html","id":"introduction","dir":"Articles","previous_headings":"","what":"Introduction","title":"Identification and classification of duplicated genes","text":"Gene genome duplications source raw genetic material evolution (Ohno 2013). However, whole-genome duplications (WGD) small-scale duplications (SSD) contribute genome evolution different manners. 
help explore different contributions WGD SSD evolution, developed doubletrouble, package can used identify classify duplicated genes whole-genome protein sequences, calculate substitution rates per substitution site (.e., KaK_a KsK_s) gene pairs, find peaks KsK_s distributions, classify gene pairs age groups.","code":""},{"path":"/articles/doubletrouble_vignette.html","id":"installation","dir":"Articles","previous_headings":"","what":"Installation","title":"Identification and classification of duplicated genes","text":"can install doubletrouble Bioconductor following code: , can load package:","code":"if(!requireNamespace(\"BiocManager\", quietly = TRUE)) {     install.packages(\"BiocManager\") }  BiocManager::install(\"doubletrouble\")  ## Check that you have a valid Bioconductor installation BiocManager::valid() library(doubletrouble)"},{"path":"/articles/doubletrouble_vignette.html","id":"data-description","dir":"Articles","previous_headings":"","what":"Data description","title":"Identification and classification of duplicated genes","text":"vignette, use protein sequences (primary transcripts ) genome annotation yeast species Saccharomyces cerevisiae Candida glabrata. Data obtained Ensembl Fungi release 54 (Yates et al. 2022). example data sets stored following objects: yeast_seq: list AAStringSet objects elements named Scerevisiae Cglabrata. yeast_annot: GRangesList object elements named Scerevisiae Cglabrata. IMPORTANT: protein sequences FASTA files directory, can read list AAStringSet objects function fasta2AAStringSetlist() Bioconductor package syntenet. Likewise, can get GRangesList object GFF/GTF files function gff2GRangesList(), also syntenet. goal identify classify duplicated genes S. cerevisiae genome. C. 
glabrata genome used outgroup identify transposed duplicates later vignette.","code":"# Load list of DIAMOND tabular output data(yeast_seq) head(yeast_seq) #> $Scerevisiae #> AAStringSet object of length 6600: #>        width seq                                            names                #>    [1]  4910 MSQDRILLDLDVVNQRLILFNS...SELPEMLSLILRQYFTDLASS YLR106C #>    [2]  4092 MCKNEARLANELIEFVAATVTG...NYERLQAKEVASSTEQLLQEM YKR054C #>    [3]  3744 MSLTEQIEQFASRFRDDDATLQ...IGSAVSPRNLARTDVNFMPWF YHR099W #>    [4]  3268 MVLFTRCEKARKEKLAAGYKPL...ETLRGSLLLAINEGHEGFGLA YDR457W #>    [5]  3144 MLESLAANLLNRLLGSYVENFD...SLYRNIAIAVREYNKYCEAIL YLL040C #>    ...   ... ... #> [6596]    25 MFSLSNSQYTCQDYISDHIWKTSSH                      YOR302W #> [6597]    25 MRAKWRKKRTRRLKRKRRKVRARSK                      YDL133C-A #> [6598]    24 MHSNNSRQILIPHQNENMFLTELY                       YDL247W-A #> [6599]    24 MLVLYRKRFSGFRFYFLSIFKYII                       YBR191W-A #> [6600]    16 MLSLIFYLRFPSYIRG                               YJR151W-A #>  #> $Cglabrata #> AAStringSet object of length 5293: #>        width seq                                            names                #>    [1]  4880 MSIQSADTVVFDLDKAFQRRDE...VELPEMLALILRQYFSDLASQ CAGL0M11616g #>    [2]  4336 MYCIIRLCLLLLYMVRFAAAIV...ITFLGIKKCIILLIIVVVSIA CAGL0I10147g #>    [3]  4041 MVQRNIELARYITTLLIGVCPK...NDIESKVLDDTKQLLNSIEYV CAGL0K08294g #>    [4]  3743 MASADQISEYAEKLKDDQQSLA...ISASVNPRNLAKTDISFMPWF CAGL0A01914g #>    [5]  3247 MVKLTRFEKLQKEKNAEYFKPF...DTLRGSLLIAINEGHEGFGLA CAGL0K06303g #>    ...   ... ... 
#> [5289]    43 MLGAPISRDTPRKTRSKTQFFQGPIVSLITEKCTYEWGNPSIN    CAGL0M02541g #> [5290]    39 MLPGGPIVVLILVGLAACIIVATIIYRKWQERQRALARF        CAGL0M03305g #> [5291]    39 MLPGGVILVFILVGLAACAIVAVIIYRKWQERQRSLQRF        CAGL0L08008g #> [5292]    37 MINEGQLQTLVIGFGLAMVVLVVVYHAVASTMAVKRD          CAGL0C05461g #> [5293]    34 MQPTIEATQKDNTQEKRDNYIVKGFFWSPDCVIA             CAGL0C01919g # Load annotation list processed with syntenet::process_input() data(yeast_annot) head(yeast_annot) #> GRangesList object of length 2: #> $Scerevisiae #> GRanges object with 27144 ranges and 9 metadata columns: #>           seqnames        ranges strand |       type     phase #>              <Rle>     <IRanges>  <Rle> |   <factor> <integer> #>       [1]        I      1-230218      * | chromosome      <NA> #>       [2]        I       335-649      + | gene            <NA> #>       [3]        I       335-649      + | mRNA            <NA> #>       [4]        I       335-649      + | exon            <NA> #>       [5]        I       335-649      + | CDS                0 #>       ...      ...           ...    ... .        ...       ... #>   [27140]      XVI 944603-947701      + |       CDS          0 #>   [27141]      XVI 946856-947338      - |       gene      <NA> #>   [27142]      XVI 946856-947338      - |       mRNA      <NA> #>   [27143]      XVI 946856-947338      - |       exon      <NA> #>   [27144]      XVI 946856-947338      - |       CDS          0 #>                               ID                 Parent              Name #>                      <character>        <CharacterList>       <character> #>       [1]           chromosome:I                                     <NA> #>       [2]           gene:YAL069W                                     <NA> #>       [3] transcript:YAL069W_m..           gene:YAL069W              <NA> #>       [4]                   <NA> transcript:YAL069W_m..   YAL069W_mRNA-E1 #>       [5]            CDS:YAL069W transcript:YAL069W_m..              
<NA> #>       ...                    ...                    ...               ... #>   [27140]            CDS:YPR204W transcript:YPR204W_m..              <NA> #>   [27141]         gene:YPR204C-A                                     <NA> #>   [27142] transcript:YPR204C-A..         gene:YPR204C-A              <NA> #>   [27143]                   <NA> transcript:YPR204C-A.. YPR204C-A_mRNA-E1 #>   [27144]          CDS:YPR204C-A transcript:YPR204C-A..              <NA> #>               gene_id  transcript_id           exon_id  protein_id #>           <character>    <character>       <character> <character> #>       [1]        <NA>           <NA>              <NA>        <NA> #>       [2]     YAL069W           <NA>              <NA>        <NA> #>       [3]        <NA>   YAL069W_mRNA              <NA>        <NA> #>       [4]        <NA>           <NA>   YAL069W_mRNA-E1        <NA> #>       [5]        <NA>           <NA>              <NA>     YAL069W #>       ...         ...            ...               ...         ... 
#>   [27140]        <NA>           <NA>              <NA>     YPR204W #>   [27141]   YPR204C-A           <NA>              <NA>        <NA> #>   [27142]        <NA> YPR204C-A_mRNA              <NA>        <NA> #>   [27143]        <NA>           <NA> YPR204C-A_mRNA-E1        <NA> #>   [27144]        <NA>           <NA>              <NA>   YPR204C-A #>   ------- #>   seqinfo: 31 sequences from an unspecified genome; no seqlengths #>  #> $Cglabrata #> GRanges object with 31671 ranges and 9 metadata columns: #>                         seqnames      ranges strand |     type     phase #>                            <Rle>   <IRanges>  <Rle> | <factor> <integer> #>       [1] ChrA_C_glabrata_CBS138    1-491328      * |   region      <NA> #>       [2] ChrA_C_glabrata_CBS138   1608-2636      - |   gene        <NA> #>       [3] ChrA_C_glabrata_CBS138   1608-2636      - |   mRNA        <NA> #>       [4] ChrA_C_glabrata_CBS138   1608-2636      - |   exon        <NA> #>       [5] ChrA_C_glabrata_CBS138   1608-2636      - |   CDS            0 #>       ...                    ...         ...    ... .      ...       ... #>   [31667] mito_C_glabrata_CBS138 15384-16067      + |     CDS          0 #>   [31668] mito_C_glabrata_CBS138 16756-17565      + |     gene      <NA> #>   [31669] mito_C_glabrata_CBS138 16756-17565      + |     mRNA      <NA> #>   [31670] mito_C_glabrata_CBS138 16756-17565      + |     exon      <NA> #>   [31671] mito_C_glabrata_CBS138 16756-17565      + |     CDS          0 #>                               ID                 Parent              Name #>                      <character>        <CharacterList>       <character> #>       [1] region:ChrA_C_glabra..                                     <NA> #>       [2]      gene:CAGL0A00105g                                     <NA> #>       [3] transcript:CAGL0A001..      gene:CAGL0A00105g              <NA> #>       [4]                   <NA> transcript:CAGL0A001.. 
CAGL0A00105g-T-E1 #>       [5]  CDS:CAGL0A00105g-T-p1 transcript:CAGL0A001..              <NA> #>       ...                    ...                    ...               ... #>   [31667]     CDS:CaglfMp11-T-p1 transcript:CaglfMp11-T              <NA> #>   [31668]         gene:CaglfMp12                                     COX3 #>   [31669] transcript:CaglfMp12-T         gene:CaglfMp12              <NA> #>   [31670]                   <NA> transcript:CaglfMp12-T    CaglfMp12-T-E1 #>   [31671]     CDS:CaglfMp12-T-p1 transcript:CaglfMp12-T              <NA> #>                gene_id  transcript_id           exon_id        protein_id #>            <character>    <character>       <character>       <character> #>       [1]         <NA>           <NA>              <NA>              <NA> #>       [2] CAGL0A00105g           <NA>              <NA>              <NA> #>       [3]         <NA> CAGL0A00105g-T              <NA>              <NA> #>       [4]         <NA>           <NA> CAGL0A00105g-T-E1              <NA> #>       [5]         <NA>           <NA>              <NA> CAGL0A00105g-T-p1 #>       ...          ...            ...               ...               ... #>   [31667]         <NA>           <NA>              <NA>    CaglfMp11-T-p1 #>   [31668]    CaglfMp12           <NA>              <NA>              <NA> #>   [31669]         <NA>    CaglfMp12-T              <NA>              <NA> #>   [31670]         <NA>           <NA>    CaglfMp12-T-E1              <NA> #>   [31671]         <NA>           <NA>              <NA>    CaglfMp12-T-p1 #>   ------- #>   seqinfo: 31 sequences from an unspecified genome; no seqlengths"},{"path":"/articles/doubletrouble_vignette.html","id":"data-preparation","dir":"Articles","previous_headings":"","what":"Data preparation","title":"Identification and classification of duplicated genes","text":"First , need process list protein sequences gene ranges detect synteny syntenet. using function process_input() syntenet package. 
processed data represented list elements seq annotation, containing protein sequences gene ranges species, respectively. Finally, need perform pairwise sequence similarity searches identify whole set paralogous gene pairs. can using function run_diamond() syntenet package 1, setting compare = \"intraspecies\" perform intraspecies comparisons. voilà! Now DIAMOND output processed annotation, can classify duplicated genes.","code":"library(syntenet)  # Process input data pdata <- process_input(yeast_seq, yeast_annot)  # Inspect the output names(pdata) #> [1] \"seq\"        \"annotation\" pdata$seq #> $Scerevisiae #> AAStringSet object of length 6600: #>        width seq                                            names                #>    [1]  4910 MSQDRILLDLDVVNQRLILFNS...SELPEMLSLILRQYFTDLASS Sce_YLR106C #>    [2]  4092 MCKNEARLANELIEFVAATVTG...NYERLQAKEVASSTEQLLQEM Sce_YKR054C #>    [3]  3744 MSLTEQIEQFASRFRDDDATLQ...IGSAVSPRNLARTDVNFMPWF Sce_YHR099W #>    [4]  3268 MVLFTRCEKARKEKLAAGYKPL...ETLRGSLLLAINEGHEGFGLA Sce_YDR457W #>    [5]  3144 MLESLAANLLNRLLGSYVENFD...SLYRNIAIAVREYNKYCEAIL Sce_YLL040C #>    ...   ... ... 
#> [6596]    25 MFSLSNSQYTCQDYISDHIWKTSSH                      Sce_YOR302W #> [6597]    25 MRAKWRKKRTRRLKRKRRKVRARSK                      Sce_YDL133C-A #> [6598]    24 MHSNNSRQILIPHQNENMFLTELY                       Sce_YDL247W-A #> [6599]    24 MLVLYRKRFSGFRFYFLSIFKYII                       Sce_YBR191W-A #> [6600]    16 MLSLIFYLRFPSYIRG                               Sce_YJR151W-A #>  #> $Cglabrata #> AAStringSet object of length 5293: #>        width seq                                            names                #>    [1]  4880 MSIQSADTVVFDLDKAFQRRDE...VELPEMLALILRQYFSDLASQ Cgl_CAGL0M11616g #>    [2]  4336 MYCIIRLCLLLLYMVRFAAAIV...ITFLGIKKCIILLIIVVVSIA Cgl_CAGL0I10147g #>    [3]  4041 MVQRNIELARYITTLLIGVCPK...NDIESKVLDDTKQLLNSIEYV Cgl_CAGL0K08294g #>    [4]  3743 MASADQISEYAEKLKDDQQSLA...ISASVNPRNLAKTDISFMPWF Cgl_CAGL0A01914g #>    [5]  3247 MVKLTRFEKLQKEKNAEYFKPF...DTLRGSLLIAINEGHEGFGLA Cgl_CAGL0K06303g #>    ...   ... ... #> [5289]    43 MLGAPISRDTPRKTRSKTQFFQGPIVSLITEKCTYEWGNPSIN    Cgl_CAGL0M02541g #> [5290]    39 MLPGGPIVVLILVGLAACIIVATIIYRKWQERQRALARF        Cgl_CAGL0M03305g #> [5291]    39 MLPGGVILVFILVGLAACAIVAVIIYRKWQERQRSLQRF        Cgl_CAGL0L08008g #> [5292]    37 MINEGQLQTLVIGFGLAMVVLVVVYHAVASTMAVKRD          Cgl_CAGL0C05461g #> [5293]    34 MQPTIEATQKDNTQEKRDNYIVKGFFWSPDCVIA             Cgl_CAGL0C01919g pdata$annotation #> $Scerevisiae #> GRanges object with 6600 ranges and 1 metadata column: #>          seqnames        ranges strand |          gene #>             <Rle>     <IRanges>  <Rle> |   <character> #>      [1]    Sce_I       335-649      + |   Sce_YAL069W #>      [2]    Sce_I       538-792      + | Sce_YAL068W-A #>      [3]    Sce_I     1807-2169      - |   Sce_YAL068C #>      [4]    Sce_I     2480-2707      + | Sce_YAL067W-A #>      [5]    Sce_I     7235-9016      - |   Sce_YAL067C #>      ...      ...           ...    ... .           ... 
#>   [6596]  Sce_XVI 939922-941136      + |   Sce_YPR201W #>   [6597]  Sce_XVI 943032-943896      + |   Sce_YPR202W #>   [6598]  Sce_XVI 943880-944188      + |   Sce_YPR203W #>   [6599]  Sce_XVI 944603-947701      + |   Sce_YPR204W #>   [6600]  Sce_XVI 946856-947338      - | Sce_YPR204C-A #>   ------- #>   seqinfo: 17 sequences from an unspecified genome; no seqlengths #>  #> $Cglabrata #> GRanges object with 5293 ranges and 1 metadata column: #>                        seqnames      ranges strand |             gene #>                           <Rle>   <IRanges>  <Rle> |      <character> #>      [1] Cgl_ChrA_C_glabrata_..   1608-2636      - | Cgl_CAGL0A00105g #>      [2] Cgl_ChrA_C_glabrata_..   2671-4809      - | Cgl_CAGL0A00116g #>      [3] Cgl_ChrA_C_glabrata_.. 11697-13042      + | Cgl_CAGL0A00132g #>      [4] Cgl_ChrA_C_glabrata_.. 14977-15886      + | Cgl_CAGL0A00154g #>      [5] Cgl_ChrA_C_glabrata_.. 17913-19017      - | Cgl_CAGL0A00165g #>      ...                    ...         ...    ... .              ... #>   [5289] Cgl_mito_C_glabrata_.. 13275-13421      + |    Cgl_CaglfMp08 #>   [5290] Cgl_mito_C_glabrata_.. 13614-14396      + |    Cgl_CaglfMp09 #>   [5291] Cgl_mito_C_glabrata_.. 14631-14861      + |    Cgl_CaglfMp10 #>   [5292] Cgl_mito_C_glabrata_.. 15384-16067      + |    Cgl_CaglfMp11 #>   [5293] Cgl_mito_C_glabrata_.. 16756-17565      + |    Cgl_CaglfMp12 #>   ------- #>   seqinfo: 14 sequences from an unspecified genome; no seqlengths data(diamond_intra)  # Run DIAMOND in sensitive mode for S. cerevisiae only if(diamond_is_installed()) {     diamond_intra <- run_diamond(         seq = pdata$seq[\"Scerevisiae\"],         compare = \"intraspecies\",          outdir = file.path(tempdir(), \"diamond_intra\"),         ... 
= \"--sensitive\"     ) }  # Inspect output names(diamond_intra) #> [1] \"Scerevisiae_Scerevisiae\" head(diamond_intra$Scerevisiae_Scerevisiae) #>         query          db perc_identity length mismatches gap_open qstart qend #> 1 Sce_YLR106C Sce_YLR106C         100.0   4910          0        0      1 4910 #> 2 Sce_YLR106C Sce_YKR054C          22.4    420        254       19    804 1195 #> 3 Sce_YKR054C Sce_YKR054C         100.0   4092          0        0      1 4092 #> 4 Sce_YKR054C Sce_YLR106C          22.4    420        254       19   1823 2198 #> 5 Sce_YHR099W Sce_YHR099W         100.0   3744          0        0      1 3744 #> 6 Sce_YHR099W Sce_YJR066W          22.7    339        201       12   3351 3674 #>   tstart tend   evalue bitscore #> 1      1 4910 0.00e+00   9095.0 #> 2   1823 2198 1.30e-06     53.1 #> 3      1 4092 0.00e+00   7940.0 #> 4    804 1195 1.09e-06     53.1 #> 5      1 3744 0.00e+00   7334.0 #> 6   2074 2366 6.46e-08     57.0"},{"path":"/articles/doubletrouble_vignette.html","id":"classifying-duplicated-gene-pairs-and-genes","dir":"Articles","previous_headings":"","what":"Classifying duplicated gene pairs and genes","title":"Identification and classification of duplicated genes","text":"classify duplicated gene pairs based modes duplication, use function classify_gene_pairs(). function offers four different classification schemes, depending much detail want. classification schemes, along duplication modes identify required input, summarized table : Legend: SD, segmental duplication. SSD, small-scale duplication. TD, tandem duplication. PD, proximal duplication. TRD, transposon-derived duplication. rTRD, retrotransposon-derived duplication. dTRD, DNA transposon-derived duplication. DD, dispersed duplication. shown table, minimal input objects : blast_list: list data frames DIAMOND (BLASTp, etc.) tabular output intraspecies comparisons returned syntenet::run_diamond(..., compare = 'intraspecies'). 
annotation: processed annotation list (GRangesList object) returned syntenet::process_input(). However, also want identify transposon-derived duplicates (TRD) classify retrotransposon-derived duplicates (rTRD) DNA transposon-derived duplicates (dTRD), need following objects: blast_list: list data frames DIAMOND (BLASTp, etc.) tabular output interspecies comparisons (target species vs outgroup) returned syntenet::run_diamond(..., compare = <comparison_data_frame>). intron_counts: list data frames number introns per gene species, returned get_intron_counts(). , demonstrate classification scheme examples.","code":""},{"path":"/articles/doubletrouble_vignette.html","id":"the-binary-scheme-sd-vs-ssd","dir":"Articles","previous_headings":"Classifying duplicated gene pairs and genes","what":"The binary scheme (SD vs SSD)","title":"Identification and classification of duplicated genes","text":"binary scheme classifies duplicates derived either segmental duplications (SD) small-scale duplications (SSD). identify segmental duplicates, function classify_gene_pairs() performs intragenome synteny detection scans syntenet classifies detected anchor pairs segmental duplicates. remaining pairs classified originating small-scale duplications. scheme can used specifying scheme = \"binary\" function classify_gene_pairs(). function returns list data frames, containing duplicated gene pairs modes duplication species (, one species, list length 1).","code":"# Binary scheme c_binary <- classify_gene_pairs(     annotation = pdata$annotation,     blast_list = diamond_intra,     scheme = \"binary\" )  # Inspecting the output names(c_binary) #> [1] \"Scerevisiae\" head(c_binary$Scerevisiae) #>           dup1        dup2 type #> 9  Sce_YDR457W Sce_YER125W  SSD #> 10 Sce_YDR457W Sce_YJR036C  SSD #> 11 Sce_YDR457W Sce_YGL141W  SSD #> 12 Sce_YDR457W Sce_YKL010C  SSD #> 15 Sce_YBR140C Sce_YOL081W  SSD #> 21 Sce_YBL088C Sce_YBR136W  SSD  # How many pairs are there for each duplication mode? 
table(c_binary$Scerevisiae$type) #>  #>   SD  SSD  #>  342 3246"},{"path":"/articles/doubletrouble_vignette.html","id":"the-standard-scheme-ssd-td-pd-dd","dir":"Articles","previous_headings":"Classifying duplicated gene pairs and genes","what":"The standard scheme (SSD → TD, PD, DD)","title":"Identification and classification of duplicated genes","text":"Gene pairs derived small-scale duplications can classified originating tandem duplications (TD, genes adjacent ), proximal duplications (PD, genes separated genes), dispersed duplications (DD, duplicates fit previous categories). default classification scheme classify_gene_pairs(), can specified setting scheme = \"standard\".","code":"# Standard scheme c_standard <- classify_gene_pairs(     annotation = pdata$annotation,     blast_list = diamond_intra,     scheme = \"standard\" )  # Inspecting the output names(c_standard) #> [1] \"Scerevisiae\" head(c_standard$Scerevisiae) #>            dup1        dup2 type #> 124 Sce_YGR032W Sce_YLR342W   SD #> 176 Sce_YOR396W Sce_YPL283C   SD #> 189 Sce_YJL225C Sce_YIL177C   SD #> 275 Sce_YNR031C Sce_YCR073C   SD #> 285 Sce_YOR326W Sce_YAL029C   SD #> 312 Sce_YJL222W Sce_YIL173W   SD  # How many pairs are there for each duplication mode? table(c_standard$Scerevisiae$type) #>  #>   SD   TD   PD   DD  #>  342   42   80 3124"},{"path":"/articles/doubletrouble_vignette.html","id":"the-extended-scheme-ssd-td-pd-trd-dd","dir":"Articles","previous_headings":"Classifying duplicated gene pairs and genes","what":"The extended scheme (SSD → TD, PD, TRD, DD)","title":"Identification and classification of duplicated genes","text":"find transposon-derived duplicates (TRD), function classify_gene_pairs() detects syntenic regions target species outgroup species. Genes target species syntenic regions outgroup treated ancestral loci. , one gene duplicate pair ancestral locus, duplicate pair classified originating transposon-derived duplications. 
Since finding transposon-derived duplicates requires comparing target species outgroup species, first need perform similarity search target species outgroup. can syntenet::run_diamond(). parameter compare, pass 2-column data frame specifying comparisons made. 2 , identify duplicated gene pairs Saccharomyces cerevisiae using Candida glabrata outgroup. Now, pass interspecies DIAMOND output argument parameter blast_inter classify_gene_pairs().","code":"data(diamond_inter) # load pre-computed output in case DIAMOND is not installed  # Create data frame of comparisons to be made comparisons <- data.frame(     species = \"Scerevisiae\",     outgroup = \"Cglabrata\" ) comparisons #>       species  outgroup #> 1 Scerevisiae Cglabrata  # Run DIAMOND for the comparison we specified if(diamond_is_installed()) {     diamond_inter <- run_diamond(         seq = pdata$seq,         compare = comparisons,         outdir = file.path(tempdir(), \"diamond_inter\"),         ... = \"--sensitive\"     ) }  names(diamond_inter) #> [1] \"Scerevisiae_Cglabrata\" head(diamond_inter$Scerevisiae_Cglabrata) #>         query               db perc_identity length mismatches gap_open qstart #> 1 Sce_YLR106C Cgl_CAGL0M11616g          52.3   4989       2183       50      2 #> 2 Sce_YLR106C Cgl_CAGL0K08294g          23.1    347        215       12   1064 #> 3 Sce_YKR054C Cgl_CAGL0K08294g          26.5   4114       2753       81     83 #> 4 Sce_YKR054C Cgl_CAGL0M11616g          22.7    419        254       17   1823 #> 5 Sce_YHR099W Cgl_CAGL0A01914g          70.2   3761       1087       17      1 #> 6 Sce_YDR457W Cgl_CAGL0K06303g          55.5   3318       1355       39      1 #>   qend tstart tend   evalue bitscore #> 1 4909      5 4879 0.00e+00   4439.0 #> 2 1389   1770 2085 9.10e-07     53.5 #> 3 4089     87 4035 0.00e+00   1376.0 #> 4 2198    803 1194 7.59e-07     53.5 #> 5 3744      1 3743 0.00e+00   5200.0 #> 6 3268      1 3247 0.00e+00   3302.0 # Extended scheme c_extended <- 
classify_gene_pairs(     annotation = pdata$annotation,     blast_list = diamond_intra,     scheme = \"extended\",     blast_inter = diamond_inter )  # Inspecting the output names(c_extended) #> [1] \"Scerevisiae\" head(c_extended$Scerevisiae) #>            dup1        dup2 type #> 124 Sce_YGR032W Sce_YLR342W   SD #> 176 Sce_YOR396W Sce_YPL283C   SD #> 189 Sce_YJL225C Sce_YIL177C   SD #> 275 Sce_YNR031C Sce_YCR073C   SD #> 285 Sce_YOR326W Sce_YAL029C   SD #> 312 Sce_YJL222W Sce_YIL173W   SD  # How many pairs are there for each duplication mode? table(c_extended$Scerevisiae$type) #>  #>   SD   TD   PD  TRD   DD  #>  342   42   80 1015 2109"},{"path":"/articles/doubletrouble_vignette.html","id":"the-full-scheme-ssd-td-pd-rtrd-dtrd-dd","dir":"Articles","previous_headings":"Classifying duplicated gene pairs and genes","what":"The full scheme (SSD → TD, PD, rTRD, dTRD, DD)","title":"Identification and classification of duplicated genes","text":"Finally, full scheme consists classifying transposon-derived duplicates (TRD) originating retrotransposons (rTRD) DNA transposons (dTRD). , function classify_gene_pairs() uses number introns per gene find TRD pairs one gene least 1 intron, gene introns; case, pair classified originating activity retrotransposons (rTRD, .e., transposed gene without introns processed transcript retrotransposed back genome). TRD pairs classified DNA transposon-derived duplicates (dTRD). classify duplicates using scheme, first need create list data frames number introns per gene species. can done function get_intron_counts(), takes TxDb object input. TxDb objects store transcript annotations, can created family functions named makeTxDbFrom* txdbmaker package (see ?get_intron_counts() summary functions). , create list TxDb objects list GRanges objects using function makeTxDbFromGRanges txdbmaker. Importantly, create TxDb GRanges, GRanges object must contain genomic coordinates features, including transcripts, exons, etc. 
, use annotation example data set yeast_annot, processed syntenet::process_input(). TxDb objects, can get intron counts per gene get_intron_counts(). Finally, can use list classify duplicates using full scheme follows:","code":"library(txdbmaker) #> Loading required package: BiocGenerics #>  #> Attaching package: 'BiocGenerics' #> The following objects are masked from 'package:stats': #>  #>     IQR, mad, sd, var, xtabs #> The following objects are masked from 'package:base': #>  #>     anyDuplicated, aperm, append, as.data.frame, basename, cbind, #>     colnames, dirname, do.call, duplicated, eval, evalq, Filter, Find, #>     get, grep, grepl, intersect, is.unsorted, lapply, Map, mapply, #>     match, mget, order, paste, pmax, pmax.int, pmin, pmin.int, #>     Position, rank, rbind, Reduce, rownames, sapply, setdiff, table, #>     tapply, union, unique, unsplit, which.max, which.min #> Loading required package: S4Vectors #> Loading required package: stats4 #>  #> Attaching package: 'S4Vectors' #> The following object is masked from 'package:utils': #>  #>     findMatches #> The following objects are masked from 'package:base': #>  #>     expand.grid, I, unname #> Loading required package: GenomeInfoDb #> Loading required package: IRanges #> Loading required package: GenomicRanges #> Loading required package: GenomicFeatures #> Loading required package: AnnotationDbi #> Loading required package: Biobase #> Welcome to Bioconductor #>  #>     Vignettes contain introductory material; view with #>     'browseVignettes()'. To cite Bioconductor, see #>     'citation(\"Biobase\")', and for packages 'citation(\"pkgname\")'. 
#>  #> Attaching package: 'txdbmaker' #> The following objects are masked from 'package:GenomicFeatures': #>  #>     browseUCSCtrack, getChromInfoFromBiomart, makeFDbPackageFromUCSC, #>     makeFeatureDbFromUCSC, makePackageName, makeTxDb, #>     makeTxDbFromBiomart, makeTxDbFromEnsembl, makeTxDbFromGFF, #>     makeTxDbFromGRanges, makeTxDbFromUCSC, makeTxDbPackage, #>     makeTxDbPackageFromBiomart, makeTxDbPackageFromUCSC, #>     supportedMiRBaseBuildValues, supportedUCSCFeatureDbTables, #>     supportedUCSCFeatureDbTracks, supportedUCSCtables, #>     UCSCFeatureDbTableSchema # Create a list of `TxDb` objects from a list of `GRanges` objects txdb_list <- lapply(yeast_annot, txdbmaker::makeTxDbFromGRanges) txdb_list #> $Scerevisiae #> TxDb object: #> # Db type: TxDb #> # Supporting package: GenomicFeatures #> # Genome: NA #> # Nb of transcripts: 6631 #> # Db created by: txdbmaker package from Bioconductor #> # Creation time: 2024-07-25 09:05:44 +0000 (Thu, 25 Jul 2024) #> # txdbmaker version at creation time: 1.1.1 #> # RSQLite version at creation time: 2.3.7 #> # DBSCHEMAVERSION: 1.2 #>  #> $Cglabrata #> TxDb object: #> # Db type: TxDb #> # Supporting package: GenomicFeatures #> # Genome: NA #> # Nb of transcripts: 5389 #> # Db created by: txdbmaker package from Bioconductor #> # Creation time: 2024-07-25 09:05:45 +0000 (Thu, 25 Jul 2024) #> # txdbmaker version at creation time: 1.1.1 #> # RSQLite version at creation time: 2.3.7 #> # DBSCHEMAVERSION: 1.2 # Get a list of data frames with intron counts per gene for each species intron_counts <- lapply(txdb_list, get_intron_counts)  # Inspecting the list names(intron_counts) #> [1] \"Scerevisiae\" \"Cglabrata\" head(intron_counts$Scerevisiae) #>    gene introns #> 1 Q0045       7 #> 2 Q0105       5 #> 3 Q0070       4 #> 4 Q0065       3 #> 5 Q0120       3 #> 6 Q0060       2 # Full scheme c_full <- classify_gene_pairs(     annotation = pdata$annotation,     blast_list = diamond_intra,     scheme = \"full\",     
blast_inter = diamond_inter,     intron_counts = intron_counts )  # Inspecting the output names(c_full) #> [1] \"Scerevisiae\" head(c_full$Scerevisiae) #>            dup1        dup2 type #> 124 Sce_YGR032W Sce_YLR342W   SD #> 176 Sce_YOR396W Sce_YPL283C   SD #> 189 Sce_YJL225C Sce_YIL177C   SD #> 275 Sce_YNR031C Sce_YCR073C   SD #> 285 Sce_YOR326W Sce_YAL029C   SD #> 312 Sce_YJL222W Sce_YIL173W   SD  # How many pairs are there for each duplication mode? table(c_full$Scerevisiae$type) #>  #>   SD   TD   PD rTRD dTRD   DD  #>  342   42   80   52  963 2109"},{"path":"/articles/doubletrouble_vignette.html","id":"classifying-genes-into-unique-modes-of-duplication","dir":"Articles","previous_headings":"","what":"Classifying genes into unique modes of duplication","title":"Identification and classification of duplicated genes","text":"look carefully output classify_gene_pairs(), notice genes appear one duplicate pair, pairs can different duplication modes assigned. ’s nothing wrong . Consider, example, gene originated segmental duplication 60 million years ago, underwent tandem duplication 5 million years ago. output classify_gene_pairs(), ’d see gene two pairs, one SD type column, one TD. want assign gene unique mode duplication, can use function classify_genes(). function assigns duplication modes hierarchically using factor levels column type priority order. priority orders classification scheme : Binary: SD > SSD. Standard: SD > TD > PD > DD. Extended: SD > TD > PD > TRD > DD. Full: SD > TD > PD > rTRD > dTRD > DD. 
input classify_genes() list gene pairs returned classify_gene_pairs().","code":"# Classify genes into unique modes of duplication c_genes <- classify_genes(c_full)  # Inspecting the output names(c_genes) #> [1] \"Scerevisiae\" head(c_genes$Scerevisiae) #>          gene type #> 1 Sce_YGR032W   SD #> 2 Sce_YOR396W   SD #> 3 Sce_YJL225C   SD #> 4 Sce_YNR031C   SD #> 5 Sce_YOR326W   SD #> 6 Sce_YJL222W   SD  # Number of genes per mode table(c_genes$Scerevisiae$type) #>  #>   SD   TD   PD rTRD dTRD   DD  #>  683   67   70   71  883  836"},{"path":"/articles/doubletrouble_vignette.html","id":"calculating-substitution-rates-for-duplicated-gene-pairs","dir":"Articles","previous_headings":"","what":"Calculating substitution rates for duplicated gene pairs","title":"Identification and classification of duplicated genes","text":"can use function pairs2kaks() calculate rates nonsynonymous substitutions per nonsynonymous site (KaK_a), synonymouys substitutions per synonymous site (KsK_s), ratios (Ka/KsK_a/K_s). rates calculated using Bioconductor package MSA2dist, implements codon models KaKs_Calculator 2.0 (Wang et al. 2010). purpose demonstration, calculate KaK_a, KsK_s, Ka/KsK_a/K_s 5 TD-derived gene pairs. CDS TD-derived genes obtained Ensembl Fungi (Yates et al. 
2022), stored cds_scerevisiae.","code":"data(cds_scerevisiae) head(cds_scerevisiae) #> DNAStringSet object of length 6: #>     width seq                                               names                #> [1]  3486 ATGGTTAATATAAGCATCGTAGC...TTGTCGCTTTATTACTGCTATAG YJR151C #> [2]  3276 ATGGGCGAAGGAACTACTAAGGA...TTAATATTGGTATTAAACAATGA YDR040C #> [3]  3276 ATGAGCGAGGGAACTGTCAAAGA...TTAATATCAGTGTCAAGCATTAA YDR038C #> [4]  3276 ATGAGCGAGGGAACTGTCAAAGA...TTAATATTGGTATTAAACAATGA YDR039C #> [5]  2925 ATGAACAGTATGGCCGATACCGA...CCATTACAACATTTCAAACATAA YAR019C #> [6]  2646 ATGCTGGAGTTTCCAATATCAGT...TAGCTGTTCTGTTCGCCTTCTAG YJL078C  # Store DNAStringSet object in a list cds_list <- list(Scerevisiae = cds_scerevisiae)  # Keep only top five TD-derived gene pairs for demonstration purposes td_pairs <- c_full$Scerevisiae[c_full$Scerevisiae$type == \"TD\", ] gene_pairs <- list(Scerevisiae = td_pairs[seq(1, 5, by = 1), ])  # Calculate Ka, Ks, and Ka/Ks kaks <- pairs2kaks(gene_pairs, cds_list)  # Inspect the output head(kaks) #> $Scerevisiae #>    dup1  dup2       Ka       Ks    Ka_Ks type #> 1 Q0055 Q0060      NaN      NaN      NaN   TD #> 2 Q0065 Q0060 0.799925 3.549370 0.225371   TD #> 3 Q0070 Q0045 0.296216 0.438575 0.675405   TD #> 4 Q0070 Q0065 0.394617 0.582050 0.677977   TD #> 5 Q0055 Q0050 0.629343 4.257430 0.147822   TD"},{"path":"/articles/doubletrouble_vignette.html","id":"identifying-and-visualizing-k_s-peaks","dir":"Articles","previous_headings":"","what":"Identifying and visualizing KsK_s peaks","title":"Identification and classification of duplicated genes","text":"Peaks KsK_s distributions typically indicate whole-genome duplication (WGD) events, can identified fitting Gaussian mixture models (GMMs) KsK_s distributions. doubletrouble, can performed function find_ks_peaks(). However, saturation higher KsK_s values, recent WGD events can reliably identified KsK_s distributions (Vanneste, Van de Peer, Maere 2013). 
Recent WGD events commonly found plant species, maize, soybean, apple, etc. Although genomes yeast species signatures WGD, events ancient, hard find evidence using KsK_s distributions. 3 demonstrate can find peaks KsK_s distributions find_ks_peaks(), use data frame containing KsK_s values duplicate pairs soybean (Glycine max) genome, undergone 2 WGDs events ~13 ~58 million years ago (Schmutz et al. 2010). , visualize KsK_s distributions peaks using function plot_ks_peaks(). First , let’s look data quick look distribution function plot_ks_distro() (details function data visualization section).  visual inspection, can see 2 3 peaks. Based prior knowledge, know 2 WGD events occurred ancestral Glycine genus ancestral Fabaceae, seem correspond peaks see KsK_s values around 0.1 0.5, respectively. third, flattened peak around 1.6, represent WGD shared eudicots. Let’s test number peaks support: 2 3.  can see, presence 3 peaks supported (lowest BIC). function returns list mean, variance amplitude mixture components (.e., peaks), well KsK_s distribution . Now, suppose just want get first 2 peaks. can explictly saying find_ks_peaks() many peaks .  Important consideration GMMs KsK_s distributions: Peaks identified GMMs blindly regarded “truth”. Using GMMs find peaks KsK_s distributions can lead problems overfitting overclustering (Tiley, Barker, Burleigh 2018). general recommendations : Use prior knowledge. know many peaks (e.g., based literature evidence), just tell number find_ks_peaks(). Likewise, sure many peaks , know maximum number peaks N, don’t test presence >N peaks. GMMs can incorrectly identify peaks actual number. Test significance peak SiZer (Significant ZERo crossings derivatives) maps (Chaudhuri Marron 1999). can done function SiZer() R package feature. example SiZer map, let’s use feature::SiZer() assess significance 2 peaks found previously.  
blue regions SiZer map indicate significantly increasing regions curve, support 2 peaks found.","code":"# Load data and inspect it data(gmax_ks) head(gmax_ks) #>               dup1            dup2     Ks #> 1  GLYMA_01G000100 GLYMA_15G276800 0.3750 #> 3  GLYMA_01G000400 GLYMA_02G312300 0.0453 #> 8  GLYMA_01G000600 GLYMA_14G000400 0.1040 #> 10 GLYMA_01G000800 GLYMA_03G188200 0.4730 #> 11 GLYMA_01G000800 GLYMA_05G115300 1.2300 #> 12 GLYMA_01G000800 GLYMA_17G191100 1.6600  # Plot distribution plot_ks_distro(gmax_ks) # Find 2 and 3 peaks and test which one has more support peaks <- find_ks_peaks(gmax_ks$Ks, npeaks = c(2, 3), verbose = TRUE) #> Optimal number of peaks: 3 #> Bayesian Information Criterion (BIC):  #>           E         V #> 2 -86950.26 -67759.43 #> 3 -86977.90 -54202.26 #>  #> Top 3 models based on the BIC criterion:  #>       V,3       V,2       E,2  #> -54202.26 -67759.43 -86950.26 names(peaks) #> [1] \"mean\"   \"sd\"     \"lambda\" \"ks\" str(peaks) #> List of 4 #>  $ mean  : Named num [1:3] 0.118 0.531 1.482 #>   ..- attr(*, \"names\")= chr [1:3] \"1\" \"2\" \"3\" #>  $ sd    : num [1:3] 0.0549 0.2443 0.3134 #>  $ lambda: num [1:3] 0.352 0.433 0.215 #>  $ ks    : num [1:71232] 0.375 0.0453 0.104 0.473 1.23 1.66 1.72 0.13 0.0856 1.96 ...  # Visualize Ks distribution plot_ks_peaks(peaks) # Find 2 peaks ignoring Ks values > 1 peaks <- find_ks_peaks(gmax_ks$Ks, npeaks = 2, max_ks = 1) plot_ks_peaks(peaks) # Get numeric vector of Ks values <= 1 ks <- gmax_ks$Ks[gmax_ks$Ks <= 1]  # Get SiZer map feature::SiZer(ks) #> Warning: no DISPLAY variable so Tk is not available"},{"path":"/articles/doubletrouble_vignette.html","id":"classifying-genes-by-age-groups","dir":"Articles","previous_headings":"","what":"Classifying genes by age groups","title":"Identification and classification of duplicated genes","text":"Finally, can use peaks obtained classify gene pairs age group. Age groups defined based KsK_s peak pairs belong. 
useful want analyze duplicate pairs specific WGD event, instance. can function split_pairs_by_peak(). function returns list containing classified pairs data frame, ggplot object age boundaries highlighted histogram KsK_s values.","code":"# Gene pairs without age-based classification head(gmax_ks) #>               dup1            dup2     Ks #> 1  GLYMA_01G000100 GLYMA_15G276800 0.3750 #> 3  GLYMA_01G000400 GLYMA_02G312300 0.0453 #> 8  GLYMA_01G000600 GLYMA_14G000400 0.1040 #> 10 GLYMA_01G000800 GLYMA_03G188200 0.4730 #> 11 GLYMA_01G000800 GLYMA_05G115300 1.2300 #> 12 GLYMA_01G000800 GLYMA_17G191100 1.6600  # Classify gene pairs by age group pairs_age_group <- split_pairs_by_peak(gmax_ks, peaks)  # Inspecting the output names(pairs_age_group) #> [1] \"pairs\" \"plot\"  # Take a look at the classified gene pairs head(pairs_age_group$pairs) #>               dup1            dup2     ks peak #> 1  GLYMA_01G000100 GLYMA_15G276800 0.3750    1 #> 3  GLYMA_01G000400 GLYMA_02G312300 0.0453    1 #> 8  GLYMA_01G000600 GLYMA_14G000400 0.1040    1 #> 10 GLYMA_01G000800 GLYMA_03G188200 0.4730    1 #> 16 GLYMA_01G001000 GLYMA_08G359900 0.1300    1 #> 18 GLYMA_01G001100 GLYMA_08G359700 0.0856    1  # Visualize Ks distro with age boundaries pairs_age_group$plot"},{"path":"/articles/doubletrouble_vignette.html","id":"data-visualization","dir":"Articles","previous_headings":"","what":"Data visualization","title":"Identification and classification of duplicated genes","text":"Last least, doubletrouble provides users graphical functions produce publication-ready plots output classify_gene_pairs(), classify_genes(), pairs2kaks(). 
Let’s take look one one.","code":""},{"path":"/articles/doubletrouble_vignette.html","id":"visualizing-the-frequency-of-duplicates-per-mode","dir":"Articles","previous_headings":"Data visualization","what":"Visualizing the frequency of duplicates per mode","title":"Identification and classification of duplicated genes","text":"visualize frequency duplicated gene pairs genes duplication type (returned classify_gene_pairs() classify_genes(), respectively), first need create data frame counts duplicates2counts(). demonstrate works, use example data set duplicate pairs 3 fungi species (substitution rates, ignored duplicates2counts()). Now, let’s visualize frequency duplicate gene pairs duplication type function plot_duplicate_freqs(). can visualize frequencies three different ways, demonstrated .  want visually frequency duplicated genes (gene pairs), ’d first need classify genes unique modes duplication classify_genes(), repeat code . example:","code":"# Load data set with pre-computed duplicates for 3 fungi species data(fungi_kaks) names(fungi_kaks) #> [1] \"saccharomyces_cerevisiae\"  \"candida_glabrata\"          #> [3] \"schizosaccharomyces_pombe\" head(fungi_kaks$saccharomyces_cerevisiae) #>      dup1    dup2       Ka       Ks  Ka_Ks type #> 1 YGR032W YLR342W 0.058800 5.240000 0.0112   SD #> 2 YOR396W YPL283C 0.004010 0.009920 0.4040   SD #> 3 YJL225C YIL177C 0.000253 0.000758 0.3340   SD #> 4 YNR031C YCR073C 0.364000 5.070000 0.0718   SD #> 5 YOR326W YAL029C 0.396000 5.150000 0.0769   SD #> 6 YJL222W YIL173W 0.000276       NA     NA   SD  # Get a data frame of counts per mode in all species counts_table <- duplicates2counts(fungi_kaks |> classify_genes())  counts_table #>    type    n                   species #> 1    SD  683  saccharomyces_cerevisiae #> 2    TD   67  saccharomyces_cerevisiae #> 3    PD   70  saccharomyces_cerevisiae #> 4  rTRD    0  saccharomyces_cerevisiae #> 5  dTRD    0  saccharomyces_cerevisiae #> 6    DD 1790  saccharomyces_cerevisiae #> 7 
   SD   14          candida_glabrata #> 8    TD  104          candida_glabrata #> 9    PD   42          candida_glabrata #> 10 rTRD    0          candida_glabrata #> 11 dTRD    0          candida_glabrata #> 12   DD 1907          candida_glabrata #> 13   SD   53 schizosaccharomyces_pombe #> 14   TD   38 schizosaccharomyces_pombe #> 15   PD   48 schizosaccharomyces_pombe #> 16 rTRD    0 schizosaccharomyces_pombe #> 17 dTRD    0 schizosaccharomyces_pombe #> 18   DD 1853 schizosaccharomyces_pombe # A) Facets p1 <- plot_duplicate_freqs(counts_table)  # B) Stacked barplot, absolute frequencies p2 <- plot_duplicate_freqs(counts_table, plot_type = \"stack\")  # C) Stacked barplot, relative frequencies p3 <- plot_duplicate_freqs(counts_table, plot_type = \"stack_percent\")  # Combine plots, one per row patchwork::wrap_plots(p1, p2, p3, nrow = 3) +      patchwork::plot_annotation(tag_levels = \"A\") # Frequency of duplicated genes by mode classify_genes(fungi_kaks) |>   # classify genes into unique duplication types     duplicates2counts() |>      # get a data frame of counts (long format)     plot_duplicate_freqs()      # plot frequencies"},{"path":"/articles/doubletrouble_vignette.html","id":"visualizing-k_s-distributions","dir":"Articles","previous_headings":"Data visualization","what":"Visualizing KsK_s distributions","title":"Identification and classification of duplicated genes","text":"briefly demonstrated , plot KsK_s distribution whole paranome, use function plot_ks_distro().  However, visualizing distribution whole paranome can mask patterns happen duplicates originating particular duplication types. instance, looking evidence WGD events, visualizing KsK_s distribution SD-derived pairs can reveal whether syntenic genes cluster together, suggesting presence WGD history. 
visualize distribution duplication type, use bytype = TRUE plot_ks_distro().","code":"ks_df <- fungi_kaks$saccharomyces_cerevisiae  # A) Histogram, whole paranome p1 <- plot_ks_distro(ks_df, plot_type = \"histogram\")  # B) Density, whole paranome p2 <- plot_ks_distro(ks_df, plot_type = \"density\")   # C) Histogram with density lines, whole paranome p3 <- plot_ks_distro(ks_df, plot_type = \"density_histogram\")  # Combine plots side by side patchwork::wrap_plots(p1, p2, p3, nrow = 1) +     patchwork::plot_annotation(tag_levels = \"A\") # A) Duplicates by type, histogram p1 <- plot_ks_distro(ks_df, bytype = TRUE, plot_type = \"histogram\")  # B) Duplicates by type, violin p2 <- plot_ks_distro(ks_df, bytype = TRUE, plot_type = \"violin\")  # Combine plots side by side patchwork::wrap_plots(p1, p2) +     patchwork::plot_annotation(tag_levels = \"A\")"},{"path":"/articles/doubletrouble_vignette.html","id":"visualizing-substitution-rates-by-species","dir":"Articles","previous_headings":"Data visualization","what":"Visualizing substitution rates by species","title":"Identification and classification of duplicated genes","text":"function plot_rates_by_species() can used show distributions substitution rates (KsK_s, KaK_a, ratio Ka/KsK_a/K_s) species. 
can choose rate want visualize, whether group gene pairs duplication mode, demonstrated .","code":"# A) Ks for each species p1 <- plot_rates_by_species(fungi_kaks)  # B) Ka/Ks by duplication type for each species p2 <- plot_rates_by_species(fungi_kaks, rate_column = \"Ka_Ks\", bytype = TRUE)  # Combine plots - one per row patchwork::wrap_plots(p1, p2, nrow = 2) +     patchwork::plot_annotation(tag_levels = \"A\")"},{"path":"/articles/doubletrouble_vignette.html","id":"session-information","dir":"Articles","previous_headings":"","what":"Session information","title":"Identification and classification of duplicated genes","text":"document created following conditions:","code":"sessioninfo::session_info() #> ─ Session info ─────────────────────────────────────────────────────────────── #>  setting  value #>  version  R version 4.4.1 (2024-06-14) #>  os       Ubuntu 22.04.4 LTS #>  system   x86_64, linux-gnu #>  ui       X11 #>  language en #>  collate  en_US.UTF-8 #>  ctype    en_US.UTF-8 #>  tz       UTC #>  date     2024-07-25 #>  pandoc   3.2 @ /usr/bin/ (via rmarkdown) #>  #> ─ Packages ─────────────────────────────────────────────────────────────────── #>  package              * version   date (UTC) lib source #>  abind                  1.4-5     2016-07-21 [1] RSPM (R 4.4.0) #>  ade4                   1.7-22    2023-02-06 [1] RSPM (R 4.4.0) #>  AnnotationDbi        * 1.67.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  ape                    5.8       2024-04-11 [1] RSPM (R 4.4.0) #>  Biobase              * 2.65.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  BiocFileCache          2.13.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  BiocGenerics         * 0.51.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  BiocIO                 1.15.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  BiocManager            1.30.23   2024-05-04 [2] CRAN (R 4.4.1) #>  BiocParallel           1.39.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  BiocStyle        
    * 2.33.1    2024-06-12 [1] Bioconductor 3.20 (R 4.4.0) #>  biomaRt                2.61.2    2024-06-24 [1] Bioconductor 3.20 (R 4.4.1) #>  Biostrings             2.73.1    2024-06-02 [1] Bioconductor 3.20 (R 4.4.0) #>  bit                    4.0.5     2022-11-15 [1] RSPM (R 4.4.0) #>  bit64                  4.0.5     2020-08-30 [1] RSPM (R 4.4.0) #>  bitops                 1.0-7     2021-04-24 [1] RSPM (R 4.4.0) #>  blob                   1.2.4     2023-03-17 [1] RSPM (R 4.4.0) #>  bookdown               0.40      2024-07-02 [1] RSPM (R 4.4.0) #>  bslib                  0.7.0     2024-03-29 [2] RSPM (R 4.4.0) #>  cachem                 1.1.0     2024-05-16 [2] RSPM (R 4.4.0) #>  cli                    3.6.3     2024-06-21 [2] RSPM (R 4.4.0) #>  coda                   0.19-4.1  2024-01-31 [1] RSPM (R 4.4.0) #>  codetools              0.2-20    2024-03-31 [3] CRAN (R 4.4.1) #>  colorspace             2.1-0     2023-01-23 [1] RSPM (R 4.4.0) #>  crayon                 1.5.3     2024-06-20 [2] RSPM (R 4.4.0) #>  curl                   5.2.1     2024-03-01 [2] RSPM (R 4.4.0) #>  DBI                    1.2.3     2024-06-02 [1] RSPM (R 4.4.0) #>  dbplyr                 2.5.0     2024-03-19 [1] RSPM (R 4.4.0) #>  DelayedArray           0.31.9    2024-07-17 [1] Bioconductor 3.20 (R 4.4.1) #>  desc                   1.4.3     2023-12-10 [2] RSPM (R 4.4.0) #>  digest                 0.6.36    2024-06-23 [2] RSPM (R 4.4.0) #>  doParallel             1.0.17    2022-02-07 [1] RSPM (R 4.4.0) #>  doubletrouble        * 1.5.1     2024-07-25 [1] Bioconductor #>  dplyr                  1.1.4     2023-11-17 [1] RSPM (R 4.4.0) #>  evaluate               0.24.0    2024-06-10 [2] RSPM (R 4.4.0) #>  fansi                  1.0.6     2023-12-08 [2] RSPM (R 4.4.0) #>  farver                 2.1.2     2024-05-13 [1] RSPM (R 4.4.0) #>  fastmap                1.2.0     2024-05-15 [2] RSPM (R 4.4.0) #>  feature                1.2.15    2021-02-10 [1] RSPM (R 4.4.0) #>  filelock               
1.0.3     2023-12-11 [1] RSPM (R 4.4.0) #>  foreach                1.5.2     2022-02-02 [1] RSPM (R 4.4.0) #>  fs                     1.6.4     2024-04-25 [2] RSPM (R 4.4.0) #>  generics               0.1.3     2022-07-05 [1] RSPM (R 4.4.0) #>  GenomeInfoDb         * 1.41.1    2024-05-24 [1] Bioconductor 3.20 (R 4.4.0) #>  GenomeInfoDbData       1.2.12    2024-06-24 [1] Bioconductor #>  GenomicAlignments      1.41.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  GenomicFeatures      * 1.57.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  GenomicRanges        * 1.57.1    2024-06-12 [1] Bioconductor 3.20 (R 4.4.0) #>  ggnetwork              0.5.13    2024-02-14 [1] RSPM (R 4.4.0) #>  ggplot2                3.5.1     2024-04-23 [1] RSPM (R 4.4.0) #>  glue                   1.7.0     2024-01-09 [2] RSPM (R 4.4.0) #>  gtable                 0.3.5     2024-04-22 [1] RSPM (R 4.4.0) #>  highr                  0.11      2024-05-26 [2] RSPM (R 4.4.0) #>  hms                    1.1.3     2023-03-21 [1] RSPM (R 4.4.0) #>  htmltools              0.5.8.1   2024-04-04 [2] RSPM (R 4.4.0) #>  htmlwidgets            1.6.4     2023-12-06 [2] RSPM (R 4.4.0) #>  httr                   1.4.7     2023-08-15 [1] RSPM (R 4.4.0) #>  httr2                  1.0.2     2024-07-16 [2] RSPM (R 4.4.0) #>  igraph                 2.0.3     2024-03-13 [1] RSPM (R 4.4.0) #>  intergraph             2.0-4     2024-02-01 [1] RSPM (R 4.4.0) #>  IRanges              * 2.39.2    2024-07-17 [1] Bioconductor 3.20 (R 4.4.1) #>  iterators              1.0.14    2022-02-05 [1] RSPM (R 4.4.0) #>  jquerylib              0.1.4     2021-04-26 [2] RSPM (R 4.4.0) #>  jsonlite               1.8.8     2023-12-04 [2] RSPM (R 4.4.0) #>  KEGGREST               1.45.1    2024-06-17 [1] Bioconductor 3.20 (R 4.4.0) #>  KernSmooth             2.23-24   2024-05-17 [3] CRAN (R 4.4.1) #>  knitr                  1.48      2024-07-07 [2] RSPM (R 4.4.0) #>  ks                     1.14.2    2024-01-15 [1] RSPM (R 4.4.0) #>  
labeling               0.4.3     2023-08-29 [1] RSPM (R 4.4.0) #>  lattice                0.22-6    2024-03-20 [3] CRAN (R 4.4.1) #>  lifecycle              1.0.4     2023-11-07 [2] RSPM (R 4.4.0) #>  magrittr               2.0.3     2022-03-30 [2] RSPM (R 4.4.0) #>  MASS                   7.3-61    2024-06-13 [2] RSPM (R 4.4.0) #>  Matrix                 1.7-0     2024-04-26 [3] CRAN (R 4.4.1) #>  MatrixGenerics         1.17.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  matrixStats            1.3.0     2024-04-11 [1] RSPM (R 4.4.0) #>  mclust                 6.1.1     2024-04-29 [1] RSPM (R 4.4.0) #>  memoise                2.0.1     2021-11-26 [2] RSPM (R 4.4.0) #>  MSA2dist               1.9.0     2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  munsell                0.5.1     2024-04-01 [1] RSPM (R 4.4.0) #>  mvtnorm                1.2-5     2024-05-21 [1] RSPM (R 4.4.0) #>  network                1.18.2    2023-12-05 [1] RSPM (R 4.4.0) #>  networkD3              0.4       2017-03-18 [1] RSPM (R 4.4.0) #>  nlme                   3.1-165   2024-06-06 [2] RSPM (R 4.4.0) #>  patchwork              1.2.0     2024-01-08 [1] RSPM (R 4.4.0) #>  pheatmap               1.0.12    2019-01-04 [1] RSPM (R 4.4.0) #>  pillar                 1.9.0     2023-03-22 [2] RSPM (R 4.4.0) #>  pkgconfig              2.0.3     2019-09-22 [2] RSPM (R 4.4.0) #>  pkgdown                2.1.0     2024-07-06 [2] RSPM (R 4.4.0) #>  png                    0.1-8     2022-11-29 [1] RSPM (R 4.4.0) #>  pracma                 2.4.4     2023-11-10 [1] RSPM (R 4.4.0) #>  prettyunits            1.2.0     2023-09-24 [2] RSPM (R 4.4.0) #>  progress               1.2.3     2023-12-06 [1] RSPM (R 4.4.0) #>  purrr                  1.0.2     2023-08-10 [2] RSPM (R 4.4.0) #>  pwalign                1.1.0     2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  R6                     2.5.1     2021-08-19 [2] RSPM (R 4.4.0) #>  ragg                   1.3.2     2024-05-15 [2] RSPM (R 4.4.0) #>  rappdirs          
     0.3.3     2021-01-31 [2] RSPM (R 4.4.0) #>  RColorBrewer           1.1-3     2022-04-03 [1] RSPM (R 4.4.0) #>  Rcpp                   1.0.13    2024-07-17 [2] RSPM (R 4.4.0) #>  RCurl                  1.98-1.16 2024-07-11 [1] RSPM (R 4.4.0) #>  restfulr               0.0.15    2022-06-16 [1] RSPM (R 4.4.0) #>  rjson                  0.2.21    2022-01-09 [1] RSPM (R 4.4.0) #>  rlang                  1.1.4     2024-06-04 [2] RSPM (R 4.4.0) #>  rmarkdown              2.27      2024-05-17 [2] RSPM (R 4.4.0) #>  Rsamtools              2.21.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  RSQLite                2.3.7     2024-05-27 [1] RSPM (R 4.4.0) #>  rtracklayer            1.65.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  S4Arrays               1.5.5     2024-07-21 [1] Bioconductor 3.20 (R 4.4.1) #>  S4Vectors            * 0.43.2    2024-07-17 [1] Bioconductor 3.20 (R 4.4.1) #>  sass                   0.4.9     2024-03-15 [2] RSPM (R 4.4.0) #>  scales                 1.3.0     2023-11-28 [1] RSPM (R 4.4.0) #>  seqinr                 4.2-36    2023-12-08 [1] RSPM (R 4.4.0) #>  sessioninfo            1.2.2     2021-12-06 [2] RSPM (R 4.4.0) #>  SparseArray            1.5.25    2024-07-21 [1] Bioconductor 3.20 (R 4.4.1) #>  statnet.common         4.9.0     2023-05-24 [1] RSPM (R 4.4.0) #>  stringi                1.8.4     2024-05-06 [2] RSPM (R 4.4.0) #>  stringr                1.5.1     2023-11-14 [2] RSPM (R 4.4.0) #>  SummarizedExperiment   1.35.1    2024-06-28 [1] Bioconductor 3.20 (R 4.4.1) #>  syntenet             * 1.7.0     2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  systemfonts            1.1.0     2024-05-15 [2] RSPM (R 4.4.0) #>  textshaping            0.4.0     2024-05-24 [2] RSPM (R 4.4.0) #>  tibble                 3.2.1     2023-03-20 [2] RSPM (R 4.4.0) #>  tidyr                  1.3.1     2024-01-24 [1] RSPM (R 4.4.0) #>  tidyselect             1.2.1     2024-03-11 [1] RSPM (R 4.4.0) #>  txdbmaker            * 1.1.1     2024-06-20 [1] 
Bioconductor 3.20 (R 4.4.0) #>  UCSC.utils             1.1.0     2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  utf8                   1.2.4     2023-10-22 [2] RSPM (R 4.4.0) #>  vctrs                  0.6.5     2023-12-01 [2] RSPM (R 4.4.0) #>  withr                  3.0.0     2024-01-16 [2] RSPM (R 4.4.0) #>  xfun                   0.46      2024-07-18 [2] RSPM (R 4.4.0) #>  XML                    3.99-0.17 2024-06-25 [1] RSPM (R 4.4.0) #>  xml2                   1.3.6     2023-12-04 [2] RSPM (R 4.4.0) #>  XVector                0.45.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  yaml                   2.3.9     2024-07-05 [2] RSPM (R 4.4.0) #>  zlibbioc               1.51.1    2024-06-05 [1] Bioconductor 3.20 (R 4.4.0) #>  #>  [1] /__w/_temp/Library #>  [2] /usr/local/lib/R/site-library #>  [3] /usr/local/lib/R/library #>  #> ──────────────────────────────────────────────────────────────────────────────"},{"path":[]},{"path":"/authors.html","id":null,"dir":"","previous_headings":"","what":"Authors","title":"Authors and Citation","text":"Fabrício Almeida-Silva. Author, maintainer. Yves Van de Peer. Author.","code":""},{"path":"/authors.html","id":"citation","dir":"","previous_headings":"","what":"Citation","title":"Authors and Citation","text":"Almeida-Silva F, Van de Peer Y (2024). doubletrouble: Identification classification duplicated genes. 
R package version 1.5.1, https://github.com/almeidasilvaf/doubletrouble.","code":"@Manual{,   title = {doubletrouble: Identification and classification of duplicated genes},   author = {Fabrício Almeida-Silva and Yves {Van de Peer}},   year = {2024},   note = {R package version 1.5.1},   url = {https://github.com/almeidasilvaf/doubletrouble}, }"},{"path":"/index.html","id":"doubletrouble-","dir":"","previous_headings":"","what":"Identification and classification of duplicated genes","title":"Identification and classification of duplicated genes","text":"major goal doubletrouble identify duplicated genes whole-genome protein sequences classify based modes duplication. Duplicates can classified using four different classification schemes, increase complexity level details stepwise manner. classification schemes duplication modes can classify : Legend: SD, segmental duplication. SSD, small-scale duplication. TD, tandem duplication. PD, proximal duplication. TRD, transposon-derived duplication. rTRD, retrotransposon-derived duplication. dTRD, DNA transposon-derived duplication. DD, dispersed duplication. Besides classifying gene pairs, users can also classify genes, gene assigned unique mode duplication. Users can also calculate substitution rates per substitution site (.e., KaK_a, KsK_s ratios KaKs\\frac{K_a}{K_s}) duplicate pairs, find peaks Ks distributions Gaussian Mixture Models (GMMs), classify gene pairs age groups based Ks peaks.","code":""},{"path":"/index.html","id":"installation-instructions","dir":"","previous_headings":"","what":"Installation instructions","title":"Identification and classification of duplicated genes","text":"Get latest stable R release CRAN. 
install doubletrouble Bioconductor using following code: development version GitHub :","code":"if (!requireNamespace(\"BiocManager\", quietly = TRUE)) {     install.packages(\"BiocManager\") }  BiocManager::install(\"doubletrouble\") BiocManager::install(\"almeidasilvaf/doubletrouble\")"},{"path":"/index.html","id":"citation","dir":"","previous_headings":"","what":"Citation","title":"Identification and classification of duplicated genes","text":"citation output using citation('doubletrouble') R. Please run check updates cite doubletrouble. Please note doubletrouble made possible thanks many R bioinformatics software authors, cited either vignettes /paper(s) describing package.","code":"print(citation('doubletrouble'), bibtex = TRUE) #> To cite package 'doubletrouble' in publications use: #>  #>   Almeida-Silva F, Van de Peer Y (2022). _doubletrouble: Identification #>   and classification of duplicated genes_. R package version 1.3.0, #>   <https://github.com/almeidasilvaf/doubletrouble>. #>  #> A BibTeX entry for LaTeX users is #>  #>   @Manual{, #>     title = {doubletrouble: Identification and classification of duplicated genes}, #>     author = {Fabrício Almeida-Silva and Yves {Van de Peer}}, #>     year = {2022}, #>     note = {R package version 1.3.0}, #>     url = {https://github.com/almeidasilvaf/doubletrouble}, #>   }"},{"path":"/index.html","id":"code-of-conduct","dir":"","previous_headings":"","what":"Code of Conduct","title":"Identification and classification of duplicated genes","text":"Please note doubletrouble project released Contributor Code Conduct. contributing project, agree abide terms.","code":""},{"path":"/index.html","id":"development-tools","dir":"","previous_headings":"","what":"Development tools","title":"Identification and classification of duplicated genes","text":"Continuous code testing possible thanks GitHub actions usethis, remotes, rcmdcheck customized use Bioconductor’s docker containers BiocCheck. 
Code coverage assessment possible thanks codecov covr. documentation website automatically updated thanks pkgdown. code styled automatically thanks styler. documentation formatted thanks devtools roxygen2. details, check dev directory. package developed using biocthis.","code":""},{"path":"/reference/cds_scerevisiae.html","id":null,"dir":"Reference","previous_headings":"","what":"Coding sequences (CDS) of S. cerevisiae — cds_scerevisiae","title":"Coding sequences (CDS) of S. cerevisiae — cds_scerevisiae","text":"Data obtained Ensembl Fungi, CDS primary transcripts included.","code":""},{"path":"/reference/cds_scerevisiae.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Coding sequences (CDS) of S. cerevisiae — cds_scerevisiae","text":"","code":"data(cds_scerevisiae)"},{"path":"/reference/cds_scerevisiae.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Coding sequences (CDS) of S. cerevisiae — cds_scerevisiae","text":"DNAStringSet object CDS S. cerevisiae.","code":""},{"path":"/reference/cds_scerevisiae.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Coding sequences (CDS) of S. 
cerevisiae — cds_scerevisiae","text":"","code":"data(cds_scerevisiae)"},{"path":"/reference/classify_gene_pairs.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"Classify duplicate gene pairs based modes duplication","code":""},{"path":"/reference/classify_gene_pairs.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"","code":"classify_gene_pairs(   annotation = NULL,   blast_list = NULL,   scheme = \"standard\",   blast_inter = NULL,   intron_counts,   evalue = 1e-10,   anchors = 5,   max_gaps = 25,   proximal_max = 10,   collinearity_dir = NULL )"},{"path":"/reference/classify_gene_pairs.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"annotation processed GRangesList CompressedGRangesList object returned syntenet::process_input(). blast_list list data frames containing BLAST tabular output intraspecies comparisons. list element corresponds BLAST output given species, names list elements must match names list elements annotation. BLASTp, DIAMOND simular programs must run processed sequence data returned process_input(). scheme Character indicating classification scheme use. One \"binary\", \"standard\", \"extended\", \"full\". See details information scheme means. Default: \"standard\". blast_inter (valid scheme == \"extended\" \"full\"). list data frames containing BLAST tabular output comparison target species outgroups. Names list elements must match names list elements annotation. BLASTp, DIAMOND simular programs must run processed sequence data returned process_input(). 
intron_counts (valid scheme == \"full\"). list 2-column data frames number introns per gene returned get_intron_counts(). Names list elements must match names annotation. evalue Numeric scalar indicating E-value threshold. Default: 1e-10. anchors Numeric indicating minimum required number genes call syntenic block, syntenet::infer_syntenet. Default: 5. max_gaps Numeric indicating number upstream downstream genes search anchors, syntenet::infer_syntenet. Default: 25. proximal_max Numeric scalar maximum distance (number genes) two genes consider proximal duplicates. Default: 10. collinearity_dir Character indicating path directory .collinearity files stored. NULL, files stored subdirectory tempdir(). Default: NULL.","code":""},{"path":"/reference/classify_gene_pairs.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"list 3-column data frames duplicated gene pairs (columns 1 2), modes duplication (column 3).","code":""},{"path":"/reference/classify_gene_pairs.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"classification schemes increase complexity (number classes) order 'binary', 'standard', 'extended', 'full'. classification scheme \"binary\", duplicates classified one 'SD' (segmental duplications) 'SSD' (small-scale duplications). classification scheme \"standard\" (default), duplicates classified 'SD' (segmental duplication), 'TD' (tandem duplication), 'PD' (proximal duplication), 'DD' (dispersed duplication). classification scheme \"extended\", duplicates classified 'SD' (segmental duplication), 'TD' (tandem duplication), 'PD' (proximal duplication), 'TRD' (transposon-derived duplication), 'DD' (dispersed duplication). 
Finally, classification scheme \"full\", duplicates classified 'SD' (segmental duplication), 'TD' (tandem duplication), 'PD' (proximal duplication), 'rTRD' (retrotransposon-derived duplication), 'dTRD' (DNA transposon-derived duplication), 'DD' (dispersed duplication).","code":""},{"path":"/reference/classify_gene_pairs.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"","code":"# Load example data data(diamond_intra) data(diamond_inter) data(yeast_annot) data(yeast_seq)  # Get processed annotation data annotation <- syntenet::process_input(yeast_seq, yeast_annot)$annotation  # Get list of intron counts library(txdbmaker) #> Loading required package: BiocGenerics #>  #> Attaching package: ‘BiocGenerics’ #> The following objects are masked from ‘package:stats’: #>  #>     IQR, mad, sd, var, xtabs #> The following objects are masked from ‘package:base’: #>  #>     Filter, Find, Map, Position, Reduce, anyDuplicated, aperm, append, #>     as.data.frame, basename, cbind, colnames, dirname, do.call, #>     duplicated, eval, evalq, get, grep, grepl, intersect, is.unsorted, #>     lapply, mapply, match, mget, order, paste, pmax, pmax.int, pmin, #>     pmin.int, rank, rbind, rownames, sapply, setdiff, table, tapply, #>     union, unique, unsplit, which.max, which.min #> Loading required package: S4Vectors #> Loading required package: stats4 #>  #> Attaching package: ‘S4Vectors’ #> The following object is masked from ‘package:utils’: #>  #>     findMatches #> The following objects are masked from ‘package:base’: #>  #>     I, expand.grid, unname #> Loading required package: GenomeInfoDb #> Loading required package: IRanges #> Loading required package: GenomicRanges #> Loading required package: GenomicFeatures #> Loading required package: AnnotationDbi #> Loading required package: Biobase #> Welcome to Bioconductor #>  #>     Vignettes 
contain introductory material; view with #>     'browseVignettes()'. To cite Bioconductor, see #>     'citation(\"Biobase\")', and for packages 'citation(\"pkgname\")'. #>  #> Attaching package: ‘txdbmaker’ #> The following objects are masked from ‘package:GenomicFeatures’: #>  #>     UCSCFeatureDbTableSchema, browseUCSCtrack, getChromInfoFromBiomart, #>     makeFDbPackageFromUCSC, makeFeatureDbFromUCSC, makePackageName, #>     makeTxDb, makeTxDbFromBiomart, makeTxDbFromEnsembl, #>     makeTxDbFromGFF, makeTxDbFromGRanges, makeTxDbFromUCSC, #>     makeTxDbPackage, makeTxDbPackageFromBiomart, #>     makeTxDbPackageFromUCSC, supportedMiRBaseBuildValues, #>     supportedUCSCFeatureDbTables, supportedUCSCFeatureDbTracks, #>     supportedUCSCtables txdb_list <- lapply(yeast_annot, txdbmaker::makeTxDbFromGRanges) intron_counts <- lapply(txdb_list, get_intron_counts)  # Classify duplicates - full scheme dup_class <- classify_gene_pairs(     annotation = annotation,      blast_list = diamond_intra,      scheme = \"full\",     blast_inter = diamond_inter,      intron_counts = intron_counts )  # Check number of gene pairs per class table(dup_class$Scerevisiae$type) #>  #>   SD   TD   PD rTRD dTRD   DD  #>  342   42   80   52  963 2109"},{"path":"/reference/classify_genes.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify genes into unique modes of duplication — classify_genes","title":"Classify genes into unique modes of duplication — classify_genes","text":"Classify genes unique modes duplication","code":""},{"path":"/reference/classify_genes.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify genes into unique modes of duplication — classify_genes","text":"","code":"classify_genes(gene_pairs_list = NULL)"},{"path":"/reference/classify_genes.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify genes into unique modes of duplication — 
classify_genes","text":"gene_pairs_list List classified gene pairs returned classify_gene_pairs().","code":""},{"path":"/reference/classify_genes.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify genes into unique modes of duplication — classify_genes","text":"list 2-column data frames variables gene type representing gene ID duplication type, respectively.","code":""},{"path":"/reference/classify_genes.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Classify genes into unique modes of duplication — classify_genes","text":"gene present pairs different duplication modes, gene classified unique mode duplication following order priority indicated levels factor type. scheme \"binary\", order SD > SSD. scheme \"standard\", order SD > TD > PD > DD. scheme \"extended\", order SD > TD > PD > TRD > DD. scheme \"full\", order SD > TD > PD > rTRD > dTRD > DD.","code":""},{"path":"/reference/classify_genes.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify genes into unique modes of duplication — classify_genes","text":"","code":"data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae  cols <- c(\"dup1\", \"dup2\", \"type\") gene_pairs_list <- list(Scerevisiae = scerevisiae_kaks[, cols])  class_genes <- classify_genes(gene_pairs_list)"},{"path":"/reference/diamond_inter.html","id":null,"dir":"Reference","previous_headings":"","what":"Interspecies DIAMOND output for yeast species — diamond_inter","title":"Interspecies DIAMOND output for yeast species — diamond_inter","text":"list contains similarity search S. cerevisiae C. 
glabrata, obtained run_diamond().","code":""},{"path":"/reference/diamond_inter.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Interspecies DIAMOND output for yeast species — diamond_inter","text":"","code":"data(diamond_inter)"},{"path":"/reference/diamond_inter.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Interspecies DIAMOND output for yeast species — diamond_inter","text":"list data frames (length 1) containing output DIAMOND search S. cerevisiae C. glabrata (outgroup).","code":""},{"path":"/reference/diamond_inter.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Interspecies DIAMOND output for yeast species — diamond_inter","text":"","code":"data(diamond_inter)"},{"path":"/reference/diamond_intra.html","id":null,"dir":"Reference","previous_headings":"","what":"Intraspecies DIAMOND output for S. cerevisiae — diamond_intra","title":"Intraspecies DIAMOND output for S. cerevisiae — diamond_intra","text":"List obtained run_diamond().","code":""},{"path":"/reference/diamond_intra.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Intraspecies DIAMOND output for S. cerevisiae — diamond_intra","text":"","code":"data(diamond_intra)"},{"path":"/reference/diamond_intra.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Intraspecies DIAMOND output for S. cerevisiae — diamond_intra","text":"list data frames (length 1) containing whole paranome S. cerevisiae resulting intragenome similarity searches.","code":""},{"path":"/reference/diamond_intra.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Intraspecies DIAMOND output for S. 
cerevisiae — diamond_intra","text":"","code":"data(diamond_intra)"},{"path":"/reference/duplicates2counts.html","id":null,"dir":"Reference","previous_headings":"","what":"Get a duplicate count matrix for each genome — duplicates2counts","title":"Get a duplicate count matrix for each genome — duplicates2counts","text":"Get duplicate count matrix genome","code":""},{"path":"/reference/duplicates2counts.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Get a duplicate count matrix for each genome — duplicates2counts","text":"","code":"duplicates2counts(duplicate_list, shape = \"long\")"},{"path":"/reference/duplicates2counts.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Get a duplicate count matrix for each genome — duplicates2counts","text":"duplicate_list list data frames duplicated genes gene pairs modes duplication returned classify_gene_pairs() classify_genes(). shape Character specifying shape output data frame. One \"long\" (data frame long shape, tidyverse sense), \"wide\" (data frame wide shape, tidyverse sense). Default: \"long\".","code":""},{"path":"/reference/duplicates2counts.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Get a duplicate count matrix for each genome — duplicates2counts","text":"shape = \"wide\", count matrix containing frequency duplicated genes (gene pairs) mode species, species rows duplication modes columns. shape = \"long\", data frame long format following variables: type Factor, type duplication. n Numeric, number duplicates. 
species Character, species name","code":""},{"path":"/reference/duplicates2counts.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Get a duplicate count matrix for each genome — duplicates2counts","text":"","code":"data(fungi_kaks)  # Get unique duplicates duplicate_list <- classify_genes(fungi_kaks)  # Get count table counts <- duplicates2counts(duplicate_list)"},{"path":"/reference/find_ks_peaks.html","id":null,"dir":"Reference","previous_headings":"","what":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","title":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","text":"Find peaks Ks distribution Gaussian Mixture Models","code":""},{"path":"/reference/find_ks_peaks.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","text":"","code":"find_ks_peaks(ks, npeaks = 2, min_ks = 0.01, max_ks = 4, verbose = FALSE)"},{"path":"/reference/find_ks_peaks.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","text":"ks numeric vector Ks values. npeaks Numeric scalar indicating number peaks Ks distribution. know many peaks , can include range values, number peaks produces lowest BIC (Bayesian Information Criterion) selected optimal. Default: 2. min_ks Numeric scalar minimum Ks value. Removing small Ks values generally used avoid incorporation allelic /splice variants prevent fitting component infinity. Default: 0.01. max_ks Numeric scalar indicating maximum Ks value. Removing large Ks values usually performed account Ks saturation. Default: 4. verbose Logical indicating messages printed screen. 
Default: FALSE.","code":""},{"path":"/reference/find_ks_peaks.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","text":"list following elements: mean Numeric estimated means. sd Numeric estimated standard deviations. lambda Numeric estimated mixture weights. ks Numeric vector filtered Ks distribution based arguments passed min_ks max_ks.","code":""},{"path":"/reference/find_ks_peaks.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","text":"","code":"data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae ks <- scerevisiae_kaks$Ks  # Find 2 peaks in Ks distribution peaks <- find_ks_peaks(ks, npeaks = 2)  # From 2 to 4 peaks, verbose = TRUE to show BIC values peaks <- find_ks_peaks(ks, npeaks = c(2, 3, 4), verbose = TRUE) #> Optimal number of peaks: 4 #> Bayesian Information Criterion (BIC):  #>           E         V #> 2 -4833.369 -4312.906 #> 3 -4109.263 -3625.427 #> 4 -4124.051 -3397.111 #>  #> Top 3 models based on the BIC criterion:  #>       V,4       V,3       E,3  #> -3397.111 -3625.427 -4109.263"},{"path":"/reference/fungi_kaks.html","id":null,"dir":"Reference","previous_headings":"","what":"Duplicate pairs and Ka, Ks, and Ka/Ks values for fungi species — fungi_kaks","title":"Duplicate pairs and Ka, Ks, and Ka/Ks values for fungi species — fungi_kaks","text":"data set obtained classify_gene_pairs() followed pairs2kaks().","code":""},{"path":"/reference/fungi_kaks.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Duplicate pairs and Ka, Ks, and Ka/Ks values for fungi species — fungi_kaks","text":"","code":"data(fungi_kaks)"},{"path":"/reference/fungi_kaks.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Duplicate pairs and Ka, Ks, and 
Ka/Ks values for fungi species — fungi_kaks","text":"list data frame elements named saccharomyces_cerevisiae, candida_glabrata, schizosaccharomyces_pombe. data frame contains following variables: dup1 Character, duplicated gene 1. dup2 Character, duplicated gene 2. Ka Numeric, Ka values. Ks Numeric, Ks values. Ka_Ks Numeric, Ka/Ks values. type Character, mode duplication","code":""},{"path":"/reference/fungi_kaks.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Duplicate pairs and Ka, Ks, and Ka/Ks values for fungi species — fungi_kaks","text":"","code":"data(fungi_kaks)"},{"path":"/reference/get_anchors_list.html","id":null,"dir":"Reference","previous_headings":"","what":"Get a list of anchor pairs for each species — get_anchors_list","title":"Get a list of anchor pairs for each species — get_anchors_list","text":"Get list anchor pairs species","code":""},{"path":"/reference/get_anchors_list.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Get a list of anchor pairs for each species — get_anchors_list","text":"","code":"get_anchors_list(   blast_list = NULL,   annotation = NULL,   evalue = 1e-10,   anchors = 5,   max_gaps = 25,   collinearity_dir = NULL )"},{"path":"/reference/get_anchors_list.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Get a list of anchor pairs for each species — get_anchors_list","text":"blast_list list data frames containing BLAST tabular output intraspecies comparisons. list element corresponds BLAST output given species, names list elements must match names list elements annotation. BLASTp, DIAMOND simular programs must run processed sequence data returned process_input(). annotation processed GRangesList CompressedGRangesList object returned syntenet::process_input(). evalue Numeric scalar indicating E-value threshold. Default: 1e-10. 
anchors Numeric indicating minimum required number genes call syntenic block, syntenet::infer_syntenet. Default: 5. max_gaps Numeric indicating number upstream downstream genes search anchors, syntenet::infer_syntenet. Default: 25. collinearity_dir Character indicating path directory .collinearity files stored. NULL, files stored subdirectory tempdir(). Default: NULL.","code":""},{"path":"/reference/get_anchors_list.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Get a list of anchor pairs for each species — get_anchors_list","text":"list data frames representing intraspecies anchor pairs.","code":""},{"path":"/reference/get_anchors_list.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Get a list of anchor pairs for each species — get_anchors_list","text":"","code":"data(diamond_intra) data(yeast_annot) data(yeast_seq) blast_list <- diamond_intra  # Get processed annotation for S. cerevisiae annotation <- syntenet::process_input(yeast_seq, yeast_annot)$annotation  # Get list of intraspecies anchor pairs anchorpairs <- get_anchors_list(blast_list, annotation)"},{"path":"/reference/get_intron_counts.html","id":null,"dir":"Reference","previous_headings":"","what":"Get a data frame of intron counts per gene — get_intron_counts","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"Get data frame intron counts per gene","code":""},{"path":"/reference/get_intron_counts.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"","code":"get_intron_counts(txdb)"},{"path":"/reference/get_intron_counts.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"txdb TxDb object transcript annotations. 
See details examples create TxDb objects different kinds input.","code":""},{"path":"/reference/get_intron_counts.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"data frame intron counts per gene, variables: gene Character gene IDs. introns Numeric number introns per gene.","code":""},{"path":"/reference/get_intron_counts.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"family functions makeTxDbFrom* txdbmaker package can used create TxDb objects variety input data types. can create TxDb objects e.g., GRanges objects (makeTxDbFromGRanges()), GFF files (makeTxDbFromGFF()), Ensembl database (makeTxDbFromEnsembl), Biomart database (makeTxDbFromBiomart).","code":""},{"path":"/reference/get_intron_counts.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"","code":"data(yeast_annot)  # Create TxDb object from GRanges library(txdbmaker) txdb <- txdbmaker::makeTxDbFromGRanges(yeast_annot[[1]])  # Get intron counts intron_counts <- get_intron_counts(txdb)"},{"path":"/reference/get_segmental.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify gene pairs derived from segmental duplications — get_segmental","title":"Classify gene pairs derived from segmental duplications — get_segmental","text":"Classify gene pairs derived segmental duplications","code":""},{"path":"/reference/get_segmental.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify gene pairs derived from segmental duplications — get_segmental","text":"","code":"get_segmental(anchor_pairs = NULL, pairs = 
NULL)"},{"path":"/reference/get_segmental.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify gene pairs derived from segmental duplications — get_segmental","text":"anchor_pairs 2-column data frame anchor pairs columns 1 2. pairs 2-column data frame duplicate pairs. equivalent first 2 columns tabular output BLAST-like programs.","code":""},{"path":"/reference/get_segmental.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify gene pairs derived from segmental duplications — get_segmental","text":"3-column data frame variables: dup1 Character, duplicated gene 1 dup2 Character, duplicated gene 2 type Factor indicating duplication types, levels \"SD\" (segmental duplication) \"DD\" (dispersed duplication).","code":""},{"path":"/reference/get_segmental.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify gene pairs derived from segmental duplications — get_segmental","text":"","code":"data(diamond_intra) data(yeast_annot) data(yeast_seq) blast_list <- diamond_intra  # Get processed annotation for S. 
cerevisiae annotation <- syntenet::process_input(yeast_seq, yeast_annot)$annotation[1]  # Get list of intraspecies anchor pairs anchor_pairs <- get_anchors_list(blast_list, annotation) anchor_pairs <- anchor_pairs[[1]][, c(1, 2)]  # Get duplicate pairs from DIAMOND output duplicates <- diamond_intra[[1]][, c(1, 2)] dups <- get_segmental(anchor_pairs, duplicates)"},{"path":"/reference/get_tandem_proximal.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","title":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","text":"Classify gene pairs derived tandem proximal duplications","code":""},{"path":"/reference/get_tandem_proximal.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","text":"","code":"get_tandem_proximal(pairs = NULL, annotation_granges = NULL, proximal_max = 10)"},{"path":"/reference/get_tandem_proximal.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","text":"pairs 3-column data frame columns dup1, dup2, type indicating duplicated gene 1, duplicated gene 2, mode duplication associated pair. data frame returned get_segmental(). annotation_granges processed GRanges object element list returned syntenet::process_input(). proximal_max Numeric scalar maximum distance (number genes) two genes consider proximal duplicates. Default: 10.","code":""},{"path":"/reference/get_tandem_proximal.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","text":"3-column data frame variables: dup1 Character, duplicated gene 1. dup2 Character, duplicated gene 2. 
type Factor duplication types, levels \"SD\" (segmental duplication), \"TD\" (tandem duplication), \"PD\" (proximal duplication), \"DD\" (dispersed duplication).","code":""},{"path":"/reference/get_tandem_proximal.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","text":"","code":"data(yeast_annot) data(yeast_seq) data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae  # Get processed annotation for S. cerevisiae pdata <- annotation <- syntenet::process_input(yeast_seq, yeast_annot) annot <- pdata$annotation[[1]]  # Get duplicated pairs pairs <- scerevisiae_kaks[, c(\"dup1\", \"dup2\", \"type\")] pairs$dup1 <- paste0(\"Sce_\", pairs$dup1) pairs$dup2 <- paste0(\"Sce_\", pairs$dup2)  # Get tandem and proximal duplicates td_pd_pairs <- get_tandem_proximal(pairs, annot)"},{"path":"/reference/get_transposed.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify gene pairs originating from transposon-derived duplications — get_transposed","title":"Classify gene pairs originating from transposon-derived duplications — get_transposed","text":"Classify gene pairs originating transposon-derived duplications","code":""},{"path":"/reference/get_transposed.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify gene pairs originating from transposon-derived duplications — get_transposed","text":"","code":"get_transposed(   pairs,   blast_inter,   annotation,   evalue = 1e-10,   anchors = 5,   max_gaps = 25,   collinearity_dir = NULL )"},{"path":"/reference/get_transposed.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify gene pairs originating from transposon-derived duplications — get_transposed","text":"pairs 3-column data frame columns dup1, dup2, type indicating duplicated gene 1, duplicated gene 2, mode duplication 
associated pair. data frame returned get_tandem_proximal(). blast_inter list data frames length 1 containing BLAST tabular output comparison target species outgroup. Names list elements must match names list elements annotation. BLASTp, DIAMOND simular programs must run processed sequence data returned syntenet::process_input(). annotation processed GRangesList CompressedGRangesList object returned syntenet::process_input(). evalue Numeric scalar indicating E-value threshold. Default: 1e-10. anchors Numeric indicating minimum required number genes call syntenic block, syntenet::infer_syntenet. Default: 5. max_gaps Numeric indicating number upstream downstream genes search anchors, syntenet::infer_syntenet. Default: 25. collinearity_dir Character indicating path directory .collinearity files stored. NULL, files stored subdirectory tempdir(). Default: NULL.","code":""},{"path":"/reference/get_transposed.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify gene pairs originating from transposon-derived duplications — get_transposed","text":"3-column data frame following variables: dup1 Character, duplicated gene 1. dup2 Character, duplicated gene 2. 
type Factor duplication types, levels \"SD\" (segmental duplication), \"TD\" (tandem duplication), \"PD\" (proximal duplication), \"TRD\" (transposon-derived duplication), \"DD\" (dispersed duplication).","code":""},{"path":"/reference/get_transposed.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify gene pairs originating from transposon-derived duplications — get_transposed","text":"","code":"data(diamond_inter) data(diamond_intra) data(yeast_seq) data(yeast_annot) data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae  # Get processed annotation pdata <- syntenet::process_input(yeast_seq, yeast_annot) annotation <- pdata$annotation  # Get duplicated pairs pairs <- scerevisiae_kaks[, c(\"dup1\", \"dup2\", \"type\")] pairs$dup1 <- paste0(\"Sce_\", pairs$dup1) pairs$dup2 <- paste0(\"Sce_\", pairs$dup2)  # Classify pairs trd <- get_transposed(pairs, diamond_inter, annotation)"},{"path":"/reference/get_transposed_classes.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","title":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","text":"Classify TRD genes derived either DNA transposons retrotransposons","code":""},{"path":"/reference/get_transposed_classes.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","text":"","code":"get_transposed_classes(pairs, intron_counts)"},{"path":"/reference/get_transposed_classes.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","text":"pairs 3-column data frame columns dup1, dup2, type indicating duplicated gene 1, 
duplicated gene 2, mode duplication associated pair. data frame returned get_transposed(). intron_counts 2-column data frame columns gene introns indicating number introns gene, returned get_intron_counts.","code":""},{"path":"/reference/get_transposed_classes.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","text":"3-column data frame following variables: dup1 Character, duplicated gene 1. dup2 Character, duplicated gene 2. type Factor duplication types, levels \"SD\" (segmental duplication), \"TD\" (tandem duplication), \"PD\" (proximal duplication), \"dTRD\" (DNA transposon-derived duplication), \"rTRD\" (retrotransposon-derived duplication), \"DD\" (dispersed duplication).","code":""},{"path":"/reference/get_transposed_classes.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","text":"","code":"data(diamond_inter) data(diamond_intra) data(yeast_seq) data(yeast_annot) data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae  # Get processed annotation pdata <- syntenet::process_input(yeast_seq, yeast_annot) annotation <- pdata$annotation  # Get duplicated pairs pairs <- scerevisiae_kaks[, c(\"dup1\", \"dup2\", \"type\")] pairs$dup1 <- paste0(\"Sce_\", pairs$dup1) pairs$dup2 <- paste0(\"Sce_\", pairs$dup2)  # Classify pairs trd <- get_transposed(pairs, diamond_inter, annotation)  # Create TxDb object from GRanges library(txdbmaker) txdb <- txdbmaker::makeTxDbFromGRanges(yeast_annot[[1]])  # Get intron counts intron_counts <- get_intron_counts(txdb)  # Get TRD classes trd_classes <- get_transposed_classes(trd, intron_counts)"},{"path":"/reference/gmax_ks.html","id":null,"dir":"Reference","previous_headings":"","what":"Duplicate pairs and Ks values for Glycine max — 
gmax_ks","title":"Duplicate pairs and Ks values for Glycine max — gmax_ks","text":"data set obtained classify_gene_pairs() followed pairs2kaks().","code":""},{"path":"/reference/gmax_ks.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Duplicate pairs and Ks values for Glycine max — gmax_ks","text":"","code":"data(gmax_ks)"},{"path":"/reference/gmax_ks.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Duplicate pairs and Ks values for Glycine max — gmax_ks","text":"data frame following variables: dup1 Character, duplicated gene 1. dup2 Character, duplicated gene 2. Ks Numeric, Ks values.","code":""},{"path":"/reference/gmax_ks.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Duplicate pairs and Ks values for Glycine max — gmax_ks","text":"","code":"data(gmax_ks)"},{"path":"/reference/pairs2kaks.html","id":null,"dir":"Reference","previous_headings":"","what":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","title":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","text":"Calculate Ka, Ks, Ka/Ks duplicate gene pairs","code":""},{"path":"/reference/pairs2kaks.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","text":"","code":"pairs2kaks(gene_pairs_list, cds, model = \"MYN\", threads = 1)"},{"path":"/reference/pairs2kaks.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","text":"gene_pairs_list List data frames containing duplicated gene pairs returned classify_gene_pairs(). cds List DNAStringSet objects containing coding sequences gene. model Character scalar indicating codon model use. 
Possible values \"Li\", \"NG86\", \"NG\", \"LWL\", \"LPB\", \"MLWL\", \"MLPB\", \"GY\", \"YN\", \"MYN\", \"MS\", \"MA\", \"GNG\", \"GLWL\", \"GLPB\", \"GMLWL\", \"GMLPB\", \"GYN\", \"GMYN\". Default: \"MYN\". threads Numeric indicating number threads use. Default: 1.","code":""},{"path":"/reference/pairs2kaks.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","text":"list data frames containing gene pairs Ka, Ks, Ka/Ks values.","code":""},{"path":"/reference/pairs2kaks.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","text":"","code":"data(diamond_intra) data(diamond_inter) data(yeast_annot) data(yeast_seq) data(cds_scerevisiae) blast_list <- diamond_intra blast_inter <- diamond_inter  pdata <- syntenet::process_input(yeast_seq, yeast_annot) annot <- pdata$annotation[\"Scerevisiae\"]  # Binary classification scheme pairs <- classify_gene_pairs(annot, blast_list) td_pairs <- pairs[[1]][pairs[[1]]$type == \"TD\", ] gene_pairs_list <- list(     Scerevisiae = td_pairs[seq(1, 3, by = 1), ] )  cds <- list(Scerevisiae = cds_scerevisiae)  kaks <- pairs2kaks(gene_pairs_list, cds)"},{"path":"/reference/plot_duplicate_freqs.html","id":null,"dir":"Reference","previous_headings":"","what":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","title":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","text":"Plot frequency duplicates per mode species","code":""},{"path":"/reference/plot_duplicate_freqs.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","text":"","code":"plot_duplicate_freqs(dup_counts, plot_type = \"facet\", remove_zero = 
TRUE)"},{"path":"/reference/plot_duplicate_freqs.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","text":"dup_counts data frame long format number duplicates per mode species, returned function duplicates2counts. plot_type Character indicating plot frequencies. One 'facet' (facets level variable type), 'stack' (levels variable type stacked bars), 'stack_percent' (levels variable type stacked bars, x-axis representing relative frequencies). Default: 'facet'. remove_zero Logical indicating whether remove rows zero values. Default: TRUE.","code":""},{"path":"/reference/plot_duplicate_freqs.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","text":"ggplot object.","code":""},{"path":"/reference/plot_duplicate_freqs.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","text":"","code":"data(fungi_kaks)  # Get unique duplicates duplicate_list <- classify_genes(fungi_kaks)  # Get count table dup_counts <- duplicates2counts(duplicate_list)  # Plot counts plot_duplicate_freqs(dup_counts, plot_type = \"stack_percent\")"},{"path":"/reference/plot_ks_distro.html","id":null,"dir":"Reference","previous_headings":"","what":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","title":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","text":"Plot distribution synonymous substitution rates (Ks)","code":""},{"path":"/reference/plot_ks_distro.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","text":"","code":"plot_ks_distro(   ks_df,   min_ks = 0.01,   max_ks = 2,   bytype = FALSE, 
  type_levels = NULL,   plot_type = \"histogram\",   binwidth = 0.03 )"},{"path":"/reference/plot_ks_distro.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","text":"ks_df data frame Ks values gene pair returned pairs2kaks(). min_ks Numeric indicating minimum Ks value keep. Default: 0.01. max_ks Numeric indicating maximum Ks value keep. Default: 2. bytype Logical indicating whether plot distribution type duplication (requires column named type). type_levels (valid bytype NULL) Character indicating levels variable specified parameter group_by kept. default, levels kept. plot_type Character indicating type plot create. bytype = TRUE, possible types \"histogram\" \"violin\". bytype = FALSE, possible types \"histogram\", \"density\", \"density_histogram\". Default: \"histogram\". binwidth (valid plot_type = \"histogram\") Numeric indicating bin width. Default: 0.03.","code":""},{"path":"/reference/plot_ks_distro.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","text":"ggplot object.","code":""},{"path":"/reference/plot_ks_distro.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","text":"","code":"data(fungi_kaks) ks_df <- fungi_kaks$saccharomyces_cerevisiae  # Plot distro plot_ks_distro(ks_df, bytype = TRUE)"},{"path":"/reference/plot_ks_peaks.html","id":null,"dir":"Reference","previous_headings":"","what":"Plot histogram of Ks distribution with peaks — plot_ks_peaks","title":"Plot histogram of Ks distribution with peaks — plot_ks_peaks","text":"Plot histogram Ks distribution peaks","code":""},{"path":"/reference/plot_ks_peaks.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Plot histogram of Ks 
distribution with peaks — plot_ks_peaks","text":"","code":"plot_ks_peaks(peaks = NULL, binwidth = 0.05)"},{"path":"/reference/plot_ks_peaks.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Plot histogram of Ks distribution with peaks — plot_ks_peaks","text":"peaks list elements mean, sd, lambda, ks, returned function fins_ks_peaks(). binwidth Numeric scalar binwidth histogram. Default: 0.05.","code":""},{"path":"/reference/plot_ks_peaks.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Plot histogram of Ks distribution with peaks — plot_ks_peaks","text":"ggplot object histogram lines Ks peak.","code":""},{"path":"/reference/plot_ks_peaks.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Plot histogram of Ks distribution with peaks — plot_ks_peaks","text":"","code":"data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae ks <- scerevisiae_kaks$Ks  # Find 2 peaks in Ks distribution peaks <- find_ks_peaks(ks, npeaks = 2)  # Plot plot_ks_peaks(peaks, binwidth = 0.05)"},{"path":"/reference/plot_rates_by_species.html","id":null,"dir":"Reference","previous_headings":"","what":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"Plot distributions substitution rates (Ka, Ks, Ka/Ks) per species","code":""},{"path":"/reference/plot_rates_by_species.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"","code":"plot_rates_by_species(   kaks_list,   rate_column = \"Ks\",   bytype = FALSE,   range = c(0, 2),   fill = \"deepskyblue3\",   color = \"deepskyblue4\" 
)"},{"path":"/reference/plot_rates_by_species.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"kaks_list list data frames substitution rates per gene pair species returned pairs2kaks(). rate_column Character indicating name column plot. Default: \"Ks\". bytype Logical indicating whether show distributions type duplication. Default: FALSE. range Numeric vector length 2 indicating minimum maximum values plot. Default: c(0, 2). fill Character color use fill aesthetic. Ignored bytype = TRUE. Default: \"deepskyblue3\". color Character color use color aesthetic. Ignored bytype = FALSE. Default: \"deepskyblue4\".","code":""},{"path":"/reference/plot_rates_by_species.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"ggplot object.","code":""},{"path":"/reference/plot_rates_by_species.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"Data plotted using species order list. 
change order species plot, reorder list elements kaks_list.","code":""},{"path":"/reference/plot_rates_by_species.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"","code":"data(fungi_kaks)  # Plot rates plot_rates_by_species(fungi_kaks, rate_column = \"Ka_Ks\")"},{"path":"/reference/split_pairs_by_peak.html","id":null,"dir":"Reference","previous_headings":"","what":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","title":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","text":"purpose function classify gene pairs age 2+ Ks peaks. way, newer gene pairs found within certain number standard deviations highest peak, older genes found close within smaller peaks.","code":""},{"path":"/reference/split_pairs_by_peak.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","text":"","code":"split_pairs_by_peak(ks_df, peaks, nsd = 2, binwidth = 0.05)"},{"path":"/reference/split_pairs_by_peak.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","text":"ks_df 3-column data frame gene pairs columns 1 2, Ks values gene pair column 3. peaks list mean, standard deviation, amplitude Ks peaks generated find_ks_peaks. nsd Numeric number standard deviations consider peak. binwidth Numeric scalar binwidth histogram. 
Default: 0.05.","code":""},{"path":"/reference/split_pairs_by_peak.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","text":"list following elements: pairs 4-column data frame variables dup1 (character), dup2 (character), ks (numeric), peak (numeric), representing duplicate gene pair, Ks values, peak ID, respectively. plot ggplot object Ks peaks returned plot_ks_peaks, dashed red lines indicating boundaries peak.","code":""},{"path":"/reference/split_pairs_by_peak.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","text":"","code":"data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae  # Create a data frame of duplicate pairs and Ks values ks_df <- scerevisiae_kaks[, c(\"dup1\", \"dup2\", \"Ks\")]  # Create list of peaks peaks <- find_ks_peaks(ks_df$Ks, npeaks = 2)  # Split pairs spairs <- split_pairs_by_peak(ks_df, peaks)"},{"path":"/reference/yeast_annot.html","id":null,"dir":"Reference","previous_headings":"","what":"Genome annotation of the yeast species S. cerevisiae and C. glabrata — yeast_annot","title":"Genome annotation of the yeast species S. cerevisiae and C. glabrata — yeast_annot","text":"Data obtained Ensembl Fungi. annotation data protein-coding genes (associated mRNA, exons, CDS, etc) included.","code":""},{"path":"/reference/yeast_annot.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Genome annotation of the yeast species S. cerevisiae and C. glabrata — yeast_annot","text":"","code":"data(yeast_annot)"},{"path":"/reference/yeast_annot.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Genome annotation of the yeast species S. cerevisiae and C. 
glabrata — yeast_annot","text":"CompressedGRangesList containing elements Scerevisiae Cglabrata.","code":""},{"path":"/reference/yeast_annot.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Genome annotation of the yeast species S. cerevisiae and C. glabrata — yeast_annot","text":"","code":"data(yeast_annot)"},{"path":"/reference/yeast_seq.html","id":null,"dir":"Reference","previous_headings":"","what":"Protein sequences of the yeast species S. cerevisiae and C. glabrata — yeast_seq","title":"Protein sequences of the yeast species S. cerevisiae and C. glabrata — yeast_seq","text":"Data obtained Ensembl Fungi. translated sequences primary transcripts included.","code":""},{"path":"/reference/yeast_seq.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Protein sequences of the yeast species S. cerevisiae and C. glabrata — yeast_seq","text":"","code":"data(yeast_seq)"},{"path":"/reference/yeast_seq.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Protein sequences of the yeast species S. cerevisiae and C. glabrata — yeast_seq","text":"list AAStringSet objects elements Scerevisiae Cglabrata.","code":""},{"path":"/reference/yeast_seq.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Protein sequences of the yeast species S. cerevisiae and C. 
glabrata — yeast_seq","text":"","code":"data(yeast_seq)"},{"path":"/news/index.html","id":"doubletrouble-0990","dir":"Changelog","previous_headings":"","what":"doubletrouble 0.99.0","title":"doubletrouble 0.99.0","text":"NEW FEATURES Added NEWS.md file track changes package.","code":""},{"path":"/news/index.html","id":"doubletrouble-0992","dir":"Changelog","previous_headings":"","what":"doubletrouble 0.99.2","title":"doubletrouble 0.99.2","text":"CHANGES Small change coding style Bioconductor peer-review (m:n replaced c(m, n) seq(m,n))","code":""},{"path":"/news/index.html","id":"doubletrouble-0993","dir":"Changelog","previous_headings":"","what":"doubletrouble 0.99.3","title":"doubletrouble 0.99.3","text":"BUG FIXES Updated functions (e.g., get_anchor_list(), collinearity2blocks()) update syntenet.","code":""}]
+[{"path":"/CONTRIBUTING.html","id":null,"dir":"","previous_headings":"","what":"Contributing to doubletrouble","title":"Contributing to doubletrouble","text":"outlines propose change doubletrouble. detailed info contributing , tidyverse packages, please see development contributing guide.","code":""},{"path":"/CONTRIBUTING.html","id":"fixing-typos","dir":"","previous_headings":"","what":"Fixing typos","title":"Contributing to doubletrouble","text":"can fix typos, spelling mistakes, grammatical errors documentation directly using GitHub web interface, long changes made source file. generally means ’ll need edit roxygen2 comments .R, .Rd file. can find .R file generates .Rd reading comment first line.","code":""},{"path":"/CONTRIBUTING.html","id":"bigger-changes","dir":"","previous_headings":"","what":"Bigger changes","title":"Contributing to doubletrouble","text":"want make bigger change, ’s good idea first file issue make sure someone team agrees ’s needed. ’ve found bug, please file issue illustrates bug minimal reprex (also help write unit test, needed).","code":""},{"path":"/CONTRIBUTING.html","id":"pull-request-process","dir":"","previous_headings":"Bigger changes","what":"Pull request process","title":"Contributing to doubletrouble","text":"Fork package clone onto computer. haven’t done , recommend using usethis::create_from_github(\"almeidasilvaf/doubletrouble\", fork = TRUE). Install development dependencies devtools::install_dev_deps(), make sure package passes R CMD check running devtools::check(). R CMD check doesn’t pass cleanly, ’s good idea ask help continuing. Create Git branch pull request (PR). recommend using usethis::pr_init(\"brief-description--change\"). Make changes, commit git, create PR running usethis::pr_push(), following prompts browser. title PR briefly describe change. body PR contain Fixes #issue-number. user-facing changes, add bullet top NEWS.md (.e. just first header). 
Follow style described https://style.tidyverse.org/news.html.","code":""},{"path":"/CONTRIBUTING.html","id":"code-style","dir":"","previous_headings":"Bigger changes","what":"Code style","title":"Contributing to doubletrouble","text":"New code follow tidyverse style guide. can use styler package apply styles, please don’t restyle code nothing PR. use roxygen2, Markdown syntax, documentation. use testthat unit tests. Contributions test cases included easier accept.","code":""},{"path":"/CONTRIBUTING.html","id":"code-of-conduct","dir":"","previous_headings":"","what":"Code of Conduct","title":"Contributing to doubletrouble","text":"Please note doubletrouble project released Contributor Code Conduct. contributing project agree abide terms.","code":""},{"path":"/SUPPORT.html","id":null,"dir":"","previous_headings":"","what":"Getting help with doubletrouble","title":"Getting help with doubletrouble","text":"Thanks using doubletrouble! filing issue, places explore pieces put together make process smooth possible.","code":""},{"path":"/SUPPORT.html","id":"make-a-reprex","dir":"","previous_headings":"","what":"Make a reprex","title":"Getting help with doubletrouble","text":"Start making minimal reproducible example using reprex package. haven’t heard used reprex , ’re treat! Seriously, reprex make R-question-asking endeavors easier (pretty insane ROI five ten minutes ’ll take learn ’s ). additional reprex pointers, check Get help! section tidyverse site.","code":""},{"path":"/SUPPORT.html","id":"where-to-ask","dir":"","previous_headings":"","what":"Where to ask?","title":"Getting help with doubletrouble","text":"Armed reprex, next step figure ask. See also Bioconductor help website. ’s question: start community.rstudio.com, /StackOverflow. Bioconductor-related question, please ask Bioconductor Support Website using appropriate package tag (website send automatic email package authors). people answer questions. ’s bug: ’re right place, file issue. 
’re sure: let community help figure ! problem bug feature request, can easily return report . opening new issue, sure search issues pull requests make sure bug hasn’t reported /already fixed development version. default, search pre-populated :issue :open. can edit qualifiers (e.g. :pr, :closed) needed. example, ’d simply remove :open search issues repo, open closed.","code":""},{"path":"/SUPPORT.html","id":"what-happens-next","dir":"","previous_headings":"","what":"What happens next?","title":"Getting help with doubletrouble","text":"efficient possible, development tidyverse packages tends bursty, shouldn’t worry don’t get immediate response. Typically don’t look repo sufficient quantity issues accumulates, ’s burst intense activity focus efforts. makes development efficient avoids expensive context switching problems, cost taking longer get back . process makes good reprex particularly important might multiple months initial report start working . can’t reproduce bug, can’t fix !","code":""},{"path":"/articles/doubletrouble_vignette.html","id":"introduction","dir":"Articles","previous_headings":"","what":"Introduction","title":"Identification and classification of duplicated genes","text":"Gene genome duplications source raw genetic material evolution (Ohno 2013). However, whole-genome duplications (WGD) small-scale duplications (SSD) contribute genome evolution different manners. 
help explore different contributions WGD SSD evolution, developed doubletrouble, package can used identify classify duplicated genes whole-genome protein sequences, calculate substitution rates per substitution site (.e., KaK_a KsK_s) gene pairs, find peaks KsK_s distributions, classify gene pairs age groups.","code":""},{"path":"/articles/doubletrouble_vignette.html","id":"installation","dir":"Articles","previous_headings":"","what":"Installation","title":"Identification and classification of duplicated genes","text":"can install doubletrouble Bioconductor following code: , can load package:","code":"if(!requireNamespace(\"BiocManager\", quietly = TRUE)) {     install.packages(\"BiocManager\") }  BiocManager::install(\"doubletrouble\")  ## Check that you have a valid Bioconductor installation BiocManager::valid() library(doubletrouble)"},{"path":"/articles/doubletrouble_vignette.html","id":"data-description","dir":"Articles","previous_headings":"","what":"Data description","title":"Identification and classification of duplicated genes","text":"vignette, use protein sequences (primary transcripts ) genome annotation yeast species Saccharomyces cerevisiae Candida glabrata. Data obtained Ensembl Fungi release 54 (Yates et al. 2022). example data sets stored following objects: yeast_seq: list AAStringSet objects elements named Scerevisiae Cglabrata. yeast_annot: GRangesList object elements named Scerevisiae Cglabrata. IMPORTANT: protein sequences FASTA files directory, can read list AAStringSet objects function fasta2AAStringSetlist() Bioconductor package syntenet. Likewise, can get GRangesList object GFF/GTF files function gff2GRangesList(), also syntenet. goal identify classify duplicated genes S. cerevisiae genome. C. 
glabrata genome used outgroup identify transposed duplicates later vignette.","code":"# Load list of DIAMOND tabular output data(yeast_seq) head(yeast_seq) #> $Scerevisiae #> AAStringSet object of length 6600: #>        width seq                                            names                #>    [1]  4910 MSQDRILLDLDVVNQRLILFNS...SELPEMLSLILRQYFTDLASS YLR106C #>    [2]  4092 MCKNEARLANELIEFVAATVTG...NYERLQAKEVASSTEQLLQEM YKR054C #>    [3]  3744 MSLTEQIEQFASRFRDDDATLQ...IGSAVSPRNLARTDVNFMPWF YHR099W #>    [4]  3268 MVLFTRCEKARKEKLAAGYKPL...ETLRGSLLLAINEGHEGFGLA YDR457W #>    [5]  3144 MLESLAANLLNRLLGSYVENFD...SLYRNIAIAVREYNKYCEAIL YLL040C #>    ...   ... ... #> [6596]    25 MFSLSNSQYTCQDYISDHIWKTSSH                      YOR302W #> [6597]    25 MRAKWRKKRTRRLKRKRRKVRARSK                      YDL133C-A #> [6598]    24 MHSNNSRQILIPHQNENMFLTELY                       YDL247W-A #> [6599]    24 MLVLYRKRFSGFRFYFLSIFKYII                       YBR191W-A #> [6600]    16 MLSLIFYLRFPSYIRG                               YJR151W-A #>  #> $Cglabrata #> AAStringSet object of length 5293: #>        width seq                                            names                #>    [1]  4880 MSIQSADTVVFDLDKAFQRRDE...VELPEMLALILRQYFSDLASQ CAGL0M11616g #>    [2]  4336 MYCIIRLCLLLLYMVRFAAAIV...ITFLGIKKCIILLIIVVVSIA CAGL0I10147g #>    [3]  4041 MVQRNIELARYITTLLIGVCPK...NDIESKVLDDTKQLLNSIEYV CAGL0K08294g #>    [4]  3743 MASADQISEYAEKLKDDQQSLA...ISASVNPRNLAKTDISFMPWF CAGL0A01914g #>    [5]  3247 MVKLTRFEKLQKEKNAEYFKPF...DTLRGSLLIAINEGHEGFGLA CAGL0K06303g #>    ...   ... ... 
#> [5289]    43 MLGAPISRDTPRKTRSKTQFFQGPIVSLITEKCTYEWGNPSIN    CAGL0M02541g #> [5290]    39 MLPGGPIVVLILVGLAACIIVATIIYRKWQERQRALARF        CAGL0M03305g #> [5291]    39 MLPGGVILVFILVGLAACAIVAVIIYRKWQERQRSLQRF        CAGL0L08008g #> [5292]    37 MINEGQLQTLVIGFGLAMVVLVVVYHAVASTMAVKRD          CAGL0C05461g #> [5293]    34 MQPTIEATQKDNTQEKRDNYIVKGFFWSPDCVIA             CAGL0C01919g # Load annotation list processed with syntenet::process_input() data(yeast_annot) head(yeast_annot) #> GRangesList object of length 2: #> $Scerevisiae #> GRanges object with 27144 ranges and 9 metadata columns: #>           seqnames        ranges strand |       type     phase #>              <Rle>     <IRanges>  <Rle> |   <factor> <integer> #>       [1]        I      1-230218      * | chromosome      <NA> #>       [2]        I       335-649      + | gene            <NA> #>       [3]        I       335-649      + | mRNA            <NA> #>       [4]        I       335-649      + | exon            <NA> #>       [5]        I       335-649      + | CDS                0 #>       ...      ...           ...    ... .        ...       ... #>   [27140]      XVI 944603-947701      + |       CDS          0 #>   [27141]      XVI 946856-947338      - |       gene      <NA> #>   [27142]      XVI 946856-947338      - |       mRNA      <NA> #>   [27143]      XVI 946856-947338      - |       exon      <NA> #>   [27144]      XVI 946856-947338      - |       CDS          0 #>                               ID                 Parent              Name #>                      <character>        <CharacterList>       <character> #>       [1]           chromosome:I                                     <NA> #>       [2]           gene:YAL069W                                     <NA> #>       [3] transcript:YAL069W_m..           gene:YAL069W              <NA> #>       [4]                   <NA> transcript:YAL069W_m..   YAL069W_mRNA-E1 #>       [5]            CDS:YAL069W transcript:YAL069W_m..              
<NA> #>       ...                    ...                    ...               ... #>   [27140]            CDS:YPR204W transcript:YPR204W_m..              <NA> #>   [27141]         gene:YPR204C-A                                     <NA> #>   [27142] transcript:YPR204C-A..         gene:YPR204C-A              <NA> #>   [27143]                   <NA> transcript:YPR204C-A.. YPR204C-A_mRNA-E1 #>   [27144]          CDS:YPR204C-A transcript:YPR204C-A..              <NA> #>               gene_id  transcript_id           exon_id  protein_id #>           <character>    <character>       <character> <character> #>       [1]        <NA>           <NA>              <NA>        <NA> #>       [2]     YAL069W           <NA>              <NA>        <NA> #>       [3]        <NA>   YAL069W_mRNA              <NA>        <NA> #>       [4]        <NA>           <NA>   YAL069W_mRNA-E1        <NA> #>       [5]        <NA>           <NA>              <NA>     YAL069W #>       ...         ...            ...               ...         ... 
#>   [27140]        <NA>           <NA>              <NA>     YPR204W #>   [27141]   YPR204C-A           <NA>              <NA>        <NA> #>   [27142]        <NA> YPR204C-A_mRNA              <NA>        <NA> #>   [27143]        <NA>           <NA> YPR204C-A_mRNA-E1        <NA> #>   [27144]        <NA>           <NA>              <NA>   YPR204C-A #>   ------- #>   seqinfo: 31 sequences from an unspecified genome; no seqlengths #>  #> $Cglabrata #> GRanges object with 31671 ranges and 9 metadata columns: #>                         seqnames      ranges strand |     type     phase #>                            <Rle>   <IRanges>  <Rle> | <factor> <integer> #>       [1] ChrA_C_glabrata_CBS138    1-491328      * |   region      <NA> #>       [2] ChrA_C_glabrata_CBS138   1608-2636      - |   gene        <NA> #>       [3] ChrA_C_glabrata_CBS138   1608-2636      - |   mRNA        <NA> #>       [4] ChrA_C_glabrata_CBS138   1608-2636      - |   exon        <NA> #>       [5] ChrA_C_glabrata_CBS138   1608-2636      - |   CDS            0 #>       ...                    ...         ...    ... .      ...       ... #>   [31667] mito_C_glabrata_CBS138 15384-16067      + |     CDS          0 #>   [31668] mito_C_glabrata_CBS138 16756-17565      + |     gene      <NA> #>   [31669] mito_C_glabrata_CBS138 16756-17565      + |     mRNA      <NA> #>   [31670] mito_C_glabrata_CBS138 16756-17565      + |     exon      <NA> #>   [31671] mito_C_glabrata_CBS138 16756-17565      + |     CDS          0 #>                               ID                 Parent              Name #>                      <character>        <CharacterList>       <character> #>       [1] region:ChrA_C_glabra..                                     <NA> #>       [2]      gene:CAGL0A00105g                                     <NA> #>       [3] transcript:CAGL0A001..      gene:CAGL0A00105g              <NA> #>       [4]                   <NA> transcript:CAGL0A001.. 
CAGL0A00105g-T-E1 #>       [5]  CDS:CAGL0A00105g-T-p1 transcript:CAGL0A001..              <NA> #>       ...                    ...                    ...               ... #>   [31667]     CDS:CaglfMp11-T-p1 transcript:CaglfMp11-T              <NA> #>   [31668]         gene:CaglfMp12                                     COX3 #>   [31669] transcript:CaglfMp12-T         gene:CaglfMp12              <NA> #>   [31670]                   <NA> transcript:CaglfMp12-T    CaglfMp12-T-E1 #>   [31671]     CDS:CaglfMp12-T-p1 transcript:CaglfMp12-T              <NA> #>                gene_id  transcript_id           exon_id        protein_id #>            <character>    <character>       <character>       <character> #>       [1]         <NA>           <NA>              <NA>              <NA> #>       [2] CAGL0A00105g           <NA>              <NA>              <NA> #>       [3]         <NA> CAGL0A00105g-T              <NA>              <NA> #>       [4]         <NA>           <NA> CAGL0A00105g-T-E1              <NA> #>       [5]         <NA>           <NA>              <NA> CAGL0A00105g-T-p1 #>       ...          ...            ...               ...               ... #>   [31667]         <NA>           <NA>              <NA>    CaglfMp11-T-p1 #>   [31668]    CaglfMp12           <NA>              <NA>              <NA> #>   [31669]         <NA>    CaglfMp12-T              <NA>              <NA> #>   [31670]         <NA>           <NA>    CaglfMp12-T-E1              <NA> #>   [31671]         <NA>           <NA>              <NA>    CaglfMp12-T-p1 #>   ------- #>   seqinfo: 31 sequences from an unspecified genome; no seqlengths"},{"path":"/articles/doubletrouble_vignette.html","id":"data-preparation","dir":"Articles","previous_headings":"","what":"Data preparation","title":"Identification and classification of duplicated genes","text":"First , need process list protein sequences gene ranges detect synteny syntenet. using function process_input() syntenet package. 
processed data represented list elements seq annotation, containing protein sequences gene ranges species, respectively. Finally, need perform pairwise sequence similarity searches identify whole set paralogous gene pairs. can using function run_diamond() syntenet package 1, setting compare = \"intraspecies\" perform intraspecies comparisons. voilà! Now DIAMOND output processed annotation, can classify duplicated genes.","code":"library(syntenet)  # Process input data pdata <- process_input(yeast_seq, yeast_annot)  # Inspect the output names(pdata) #> [1] \"seq\"        \"annotation\" pdata$seq #> $Scerevisiae #> AAStringSet object of length 6600: #>        width seq                                            names                #>    [1]  4910 MSQDRILLDLDVVNQRLILFNS...SELPEMLSLILRQYFTDLASS Sce_YLR106C #>    [2]  4092 MCKNEARLANELIEFVAATVTG...NYERLQAKEVASSTEQLLQEM Sce_YKR054C #>    [3]  3744 MSLTEQIEQFASRFRDDDATLQ...IGSAVSPRNLARTDVNFMPWF Sce_YHR099W #>    [4]  3268 MVLFTRCEKARKEKLAAGYKPL...ETLRGSLLLAINEGHEGFGLA Sce_YDR457W #>    [5]  3144 MLESLAANLLNRLLGSYVENFD...SLYRNIAIAVREYNKYCEAIL Sce_YLL040C #>    ...   ... ... 
#> [6596]    25 MFSLSNSQYTCQDYISDHIWKTSSH                      Sce_YOR302W #> [6597]    25 MRAKWRKKRTRRLKRKRRKVRARSK                      Sce_YDL133C-A #> [6598]    24 MHSNNSRQILIPHQNENMFLTELY                       Sce_YDL247W-A #> [6599]    24 MLVLYRKRFSGFRFYFLSIFKYII                       Sce_YBR191W-A #> [6600]    16 MLSLIFYLRFPSYIRG                               Sce_YJR151W-A #>  #> $Cglabrata #> AAStringSet object of length 5293: #>        width seq                                            names                #>    [1]  4880 MSIQSADTVVFDLDKAFQRRDE...VELPEMLALILRQYFSDLASQ Cgl_CAGL0M11616g #>    [2]  4336 MYCIIRLCLLLLYMVRFAAAIV...ITFLGIKKCIILLIIVVVSIA Cgl_CAGL0I10147g #>    [3]  4041 MVQRNIELARYITTLLIGVCPK...NDIESKVLDDTKQLLNSIEYV Cgl_CAGL0K08294g #>    [4]  3743 MASADQISEYAEKLKDDQQSLA...ISASVNPRNLAKTDISFMPWF Cgl_CAGL0A01914g #>    [5]  3247 MVKLTRFEKLQKEKNAEYFKPF...DTLRGSLLIAINEGHEGFGLA Cgl_CAGL0K06303g #>    ...   ... ... #> [5289]    43 MLGAPISRDTPRKTRSKTQFFQGPIVSLITEKCTYEWGNPSIN    Cgl_CAGL0M02541g #> [5290]    39 MLPGGPIVVLILVGLAACIIVATIIYRKWQERQRALARF        Cgl_CAGL0M03305g #> [5291]    39 MLPGGVILVFILVGLAACAIVAVIIYRKWQERQRSLQRF        Cgl_CAGL0L08008g #> [5292]    37 MINEGQLQTLVIGFGLAMVVLVVVYHAVASTMAVKRD          Cgl_CAGL0C05461g #> [5293]    34 MQPTIEATQKDNTQEKRDNYIVKGFFWSPDCVIA             Cgl_CAGL0C01919g pdata$annotation #> $Scerevisiae #> GRanges object with 6600 ranges and 1 metadata column: #>          seqnames        ranges strand |          gene #>             <Rle>     <IRanges>  <Rle> |   <character> #>      [1]    Sce_I       335-649      + |   Sce_YAL069W #>      [2]    Sce_I       538-792      + | Sce_YAL068W-A #>      [3]    Sce_I     1807-2169      - |   Sce_YAL068C #>      [4]    Sce_I     2480-2707      + | Sce_YAL067W-A #>      [5]    Sce_I     7235-9016      - |   Sce_YAL067C #>      ...      ...           ...    ... .           ... 
#>   [6596]  Sce_XVI 939922-941136      + |   Sce_YPR201W #>   [6597]  Sce_XVI 943032-943896      + |   Sce_YPR202W #>   [6598]  Sce_XVI 943880-944188      + |   Sce_YPR203W #>   [6599]  Sce_XVI 944603-947701      + |   Sce_YPR204W #>   [6600]  Sce_XVI 946856-947338      - | Sce_YPR204C-A #>   ------- #>   seqinfo: 17 sequences from an unspecified genome; no seqlengths #>  #> $Cglabrata #> GRanges object with 5293 ranges and 1 metadata column: #>                        seqnames      ranges strand |             gene #>                           <Rle>   <IRanges>  <Rle> |      <character> #>      [1] Cgl_ChrA_C_glabrata_..   1608-2636      - | Cgl_CAGL0A00105g #>      [2] Cgl_ChrA_C_glabrata_..   2671-4809      - | Cgl_CAGL0A00116g #>      [3] Cgl_ChrA_C_glabrata_.. 11697-13042      + | Cgl_CAGL0A00132g #>      [4] Cgl_ChrA_C_glabrata_.. 14977-15886      + | Cgl_CAGL0A00154g #>      [5] Cgl_ChrA_C_glabrata_.. 17913-19017      - | Cgl_CAGL0A00165g #>      ...                    ...         ...    ... .              ... #>   [5289] Cgl_mito_C_glabrata_.. 13275-13421      + |    Cgl_CaglfMp08 #>   [5290] Cgl_mito_C_glabrata_.. 13614-14396      + |    Cgl_CaglfMp09 #>   [5291] Cgl_mito_C_glabrata_.. 14631-14861      + |    Cgl_CaglfMp10 #>   [5292] Cgl_mito_C_glabrata_.. 15384-16067      + |    Cgl_CaglfMp11 #>   [5293] Cgl_mito_C_glabrata_.. 16756-17565      + |    Cgl_CaglfMp12 #>   ------- #>   seqinfo: 14 sequences from an unspecified genome; no seqlengths data(diamond_intra)  # Run DIAMOND in sensitive mode for S. cerevisiae only if(diamond_is_installed()) {     diamond_intra <- run_diamond(         seq = pdata$seq[\"Scerevisiae\"],         compare = \"intraspecies\",          outdir = file.path(tempdir(), \"diamond_intra\"),         ... 
= \"--sensitive\"     ) }  # Inspect output names(diamond_intra) #> [1] \"Scerevisiae_Scerevisiae\" head(diamond_intra$Scerevisiae_Scerevisiae) #>         query          db perc_identity length mismatches gap_open qstart qend #> 1 Sce_YLR106C Sce_YLR106C         100.0   4910          0        0      1 4910 #> 2 Sce_YLR106C Sce_YKR054C          22.4    420        254       19    804 1195 #> 3 Sce_YKR054C Sce_YKR054C         100.0   4092          0        0      1 4092 #> 4 Sce_YKR054C Sce_YLR106C          22.4    420        254       19   1823 2198 #> 5 Sce_YHR099W Sce_YHR099W         100.0   3744          0        0      1 3744 #> 6 Sce_YHR099W Sce_YJR066W          22.7    339        201       12   3351 3674 #>   tstart tend   evalue bitscore #> 1      1 4910 0.00e+00   9095.0 #> 2   1823 2198 1.30e-06     53.1 #> 3      1 4092 0.00e+00   7940.0 #> 4    804 1195 1.09e-06     53.1 #> 5      1 3744 0.00e+00   7334.0 #> 6   2074 2366 6.46e-08     57.0"},{"path":"/articles/doubletrouble_vignette.html","id":"classifying-duplicated-gene-pairs-and-genes","dir":"Articles","previous_headings":"","what":"Classifying duplicated gene pairs and genes","title":"Identification and classification of duplicated genes","text":"classify duplicated gene pairs based modes duplication, use function classify_gene_pairs(). function offers four different classification schemes, depending much detail want. classification schemes, along duplication modes identify required input, summarized table : Legend: SD, segmental duplication. SSD, small-scale duplication. TD, tandem duplication. PD, proximal duplication. TRD, transposon-derived duplication. rTRD, retrotransposon-derived duplication. dTRD, DNA transposon-derived duplication. DD, dispersed duplication. shown table, minimal input objects : blast_list: list data frames DIAMOND (BLASTp, etc.) tabular output intraspecies comparisons returned syntenet::run_diamond(..., compare = 'intraspecies'). 
annotation: processed annotation list (GRangesList object) returned syntenet::process_input(). However, also want identify transposon-derived duplicates (TRD) classify retrotransposon-derived duplicates (rTRD) DNA transposon-derived duplicates (dTRD), need following objects: blast_list: list data frames DIAMOND (BLASTp, etc.) tabular output interspecies comparisons (target species vs outgroup) returned syntenet::run_diamond(..., compare = <comparison_data_frame>). intron_counts: list data frames number introns per gene species, returned get_intron_counts(). , demonstrate classification scheme examples.","code":""},{"path":"/articles/doubletrouble_vignette.html","id":"the-binary-scheme-sd-vs-ssd","dir":"Articles","previous_headings":"Classifying duplicated gene pairs and genes","what":"The binary scheme (SD vs SSD)","title":"Identification and classification of duplicated genes","text":"binary scheme classifies duplicates derived either segmental duplications (SD) small-scale duplications (SSD). identify segmental duplicates, function classify_gene_pairs() performs intragenome synteny detection scans syntenet classifies detected anchor pairs segmental duplicates. remaining pairs classified originating small-scale duplications. scheme can used specifying scheme = \"binary\" function classify_gene_pairs(). function returns list data frames, containing duplicated gene pairs modes duplication species (, one species, list length 1).","code":"# Binary scheme c_binary <- classify_gene_pairs(     annotation = pdata$annotation,     blast_list = diamond_intra,     scheme = \"binary\" )  # Inspecting the output names(c_binary) #> [1] \"Scerevisiae\" head(c_binary$Scerevisiae) #>           dup1        dup2 type #> 9  Sce_YDR457W Sce_YER125W  SSD #> 10 Sce_YDR457W Sce_YJR036C  SSD #> 11 Sce_YDR457W Sce_YGL141W  SSD #> 12 Sce_YDR457W Sce_YKL010C  SSD #> 15 Sce_YBR140C Sce_YOL081W  SSD #> 21 Sce_YBL088C Sce_YBR136W  SSD  # How many pairs are there for each duplication mode? 
table(c_binary$Scerevisiae$type) #>  #>   SD  SSD  #>  342 3246"},{"path":"/articles/doubletrouble_vignette.html","id":"the-standard-scheme-ssd-td-pd-dd","dir":"Articles","previous_headings":"Classifying duplicated gene pairs and genes","what":"The standard scheme (SSD → TD, PD, DD)","title":"Identification and classification of duplicated genes","text":"Gene pairs derived small-scale duplications can classified originating tandem duplications (TD, genes adjacent ), proximal duplications (PD, genes separated genes), dispersed duplications (DD, duplicates fit previous categories). default classification scheme classify_gene_pairs(), can specified setting scheme = \"standard\".","code":"# Standard scheme c_standard <- classify_gene_pairs(     annotation = pdata$annotation,     blast_list = diamond_intra,     scheme = \"standard\" )  # Inspecting the output names(c_standard) #> [1] \"Scerevisiae\" head(c_standard$Scerevisiae) #>            dup1        dup2 type #> 124 Sce_YGR032W Sce_YLR342W   SD #> 176 Sce_YOR396W Sce_YPL283C   SD #> 189 Sce_YJL225C Sce_YIL177C   SD #> 275 Sce_YNR031C Sce_YCR073C   SD #> 285 Sce_YOR326W Sce_YAL029C   SD #> 312 Sce_YJL222W Sce_YIL173W   SD  # How many pairs are there for each duplication mode? table(c_standard$Scerevisiae$type) #>  #>   SD   TD   PD   DD  #>  342   42   80 3124"},{"path":"/articles/doubletrouble_vignette.html","id":"the-extended-scheme-ssd-td-pd-trd-dd","dir":"Articles","previous_headings":"Classifying duplicated gene pairs and genes","what":"The extended scheme (SSD → TD, PD, TRD, DD)","title":"Identification and classification of duplicated genes","text":"find transposon-derived duplicates (TRD), function classify_gene_pairs() detects syntenic regions target species outgroup species. Genes target species syntenic regions outgroup treated ancestral loci. , one gene duplicate pair ancestral locus, duplicate pair classified originating transposon-derived duplications. 
Since finding transposon-derived duplicates requires comparing target species outgroup species, first need perform similarity search target species outgroup. can syntenet::run_diamond(). parameter compare, pass 2-column data frame specifying comparisons made. 2 , identify duplicated gene pairs Saccharomyces cerevisiae using Candida glabrata outgroup. Now, pass interspecies DIAMOND output argument parameter blast_inter classify_gene_pairs().","code":"data(diamond_inter) # load pre-computed output in case DIAMOND is not installed  # Create data frame of comparisons to be made comparisons <- data.frame(     species = \"Scerevisiae\",     outgroup = \"Cglabrata\" ) comparisons #>       species  outgroup #> 1 Scerevisiae Cglabrata  # Run DIAMOND for the comparison we specified if(diamond_is_installed()) {     diamond_inter <- run_diamond(         seq = pdata$seq,         compare = comparisons,         outdir = file.path(tempdir(), \"diamond_inter\"),         ... = \"--sensitive\"     ) }  names(diamond_inter) #> [1] \"Scerevisiae_Cglabrata\" head(diamond_inter$Scerevisiae_Cglabrata) #>         query               db perc_identity length mismatches gap_open qstart #> 1 Sce_YLR106C Cgl_CAGL0M11616g          52.3   4989       2183       50      2 #> 2 Sce_YLR106C Cgl_CAGL0K08294g          23.1    347        215       12   1064 #> 3 Sce_YKR054C Cgl_CAGL0K08294g          26.5   4114       2753       81     83 #> 4 Sce_YKR054C Cgl_CAGL0M11616g          22.7    419        254       17   1823 #> 5 Sce_YHR099W Cgl_CAGL0A01914g          70.2   3761       1087       17      1 #> 6 Sce_YDR457W Cgl_CAGL0K06303g          55.5   3318       1355       39      1 #>   qend tstart tend   evalue bitscore #> 1 4909      5 4879 0.00e+00   4439.0 #> 2 1389   1770 2085 9.10e-07     53.5 #> 3 4089     87 4035 0.00e+00   1376.0 #> 4 2198    803 1194 7.59e-07     53.5 #> 5 3744      1 3743 0.00e+00   5200.0 #> 6 3268      1 3247 0.00e+00   3302.0 # Extended scheme c_extended <- 
classify_gene_pairs(     annotation = pdata$annotation,     blast_list = diamond_intra,     scheme = \"extended\",     blast_inter = diamond_inter )  # Inspecting the output names(c_extended) #> [1] \"Scerevisiae\" head(c_extended$Scerevisiae) #>            dup1        dup2 type #> 124 Sce_YGR032W Sce_YLR342W   SD #> 176 Sce_YOR396W Sce_YPL283C   SD #> 189 Sce_YJL225C Sce_YIL177C   SD #> 275 Sce_YNR031C Sce_YCR073C   SD #> 285 Sce_YOR326W Sce_YAL029C   SD #> 312 Sce_YJL222W Sce_YIL173W   SD  # How many pairs are there for each duplication mode? table(c_extended$Scerevisiae$type) #>  #>   SD   TD   PD  TRD   DD  #>  342   42   80 1015 2109"},{"path":"/articles/doubletrouble_vignette.html","id":"the-full-scheme-ssd-td-pd-rtrd-dtrd-dd","dir":"Articles","previous_headings":"Classifying duplicated gene pairs and genes","what":"The full scheme (SSD → TD, PD, rTRD, dTRD, DD)","title":"Identification and classification of duplicated genes","text":"Finally, full scheme consists classifying transposon-derived duplicates (TRD) originating retrotransposons (rTRD) DNA transposons (dTRD). , function classify_gene_pairs() uses number introns per gene find TRD pairs one gene least 1 intron, gene introns; case, pair classified originating activity retrotransposons (rTRD, .e., transposed gene without introns processed transcript retrotransposed back genome). TRD pairs classified DNA transposon-derived duplicates (dTRD). classify duplicates using scheme, first need create list data frames number introns per gene species. can done function get_intron_counts(), takes TxDb object input. TxDb objects store transcript annotations, can created family functions named makeTxDbFrom* txdbmaker package (see ?get_intron_counts() summary functions). , create list TxDb objects list GRanges objects using function makeTxDbFromGRanges() txdbmaker. Importantly, create TxDb GRanges, GRanges object must contain genomic coordinates features, including transcripts, exons, etc. 
, use annotation example data set yeast_annot, processed syntenet::process_input(). TxDb objects, can get intron counts per gene get_intron_counts(). Finally, can use list classify duplicates using full scheme follows:","code":"library(txdbmaker) # Create a list of `TxDb` objects from a list of `GRanges` objects txdb_list <- lapply(yeast_annot, txdbmaker::makeTxDbFromGRanges) txdb_list #> $Scerevisiae #> TxDb object: #> # Db type: TxDb #> # Supporting package: GenomicFeatures #> # Genome: NA #> # Nb of transcripts: 6631 #> # Db created by: txdbmaker package from Bioconductor #> # Creation time: 2024-10-02 09:49:23 +0000 (Wed, 02 Oct 2024) #> # txdbmaker version at creation time: 1.1.1 #> # RSQLite version at creation time: 2.3.7 #> # DBSCHEMAVERSION: 1.2 #>  #> $Cglabrata #> TxDb object: #> # Db type: TxDb #> # Supporting package: GenomicFeatures #> # Genome: NA #> # Nb of transcripts: 5389 #> # Db created by: txdbmaker package from Bioconductor #> # Creation time: 2024-10-02 09:49:23 +0000 (Wed, 02 Oct 2024) #> # txdbmaker version at creation time: 1.1.1 #> # RSQLite version at creation time: 2.3.7 #> # DBSCHEMAVERSION: 1.2 # Get a list of data frames with intron counts per gene for each species intron_counts <- lapply(txdb_list, get_intron_counts)  # Inspecting the list names(intron_counts) #> [1] \"Scerevisiae\" \"Cglabrata\" head(intron_counts$Scerevisiae) #>    gene introns #> 1 Q0045       7 #> 2 Q0105       5 #> 3 Q0070       4 #> 4 Q0065       3 #> 5 Q0120       3 #> 6 Q0060       2 # Full scheme c_full <- classify_gene_pairs(     annotation = pdata$annotation,     blast_list = diamond_intra,     scheme = \"full\",     blast_inter = diamond_inter,     intron_counts = intron_counts )  # Inspecting the output names(c_full) #> [1] \"Scerevisiae\" head(c_full$Scerevisiae) #>            dup1        dup2 type #> 124 Sce_YGR032W Sce_YLR342W   SD #> 176 Sce_YOR396W Sce_YPL283C   SD #> 189 Sce_YJL225C Sce_YIL177C   SD #> 275 Sce_YNR031C Sce_YCR073C   SD #> 285 
Sce_YOR326W Sce_YAL029C   SD #> 312 Sce_YJL222W Sce_YIL173W   SD  # How many pairs are there for each duplication mode? table(c_full$Scerevisiae$type) #>  #>   SD   TD   PD rTRD dTRD   DD  #>  342   42   80   52  963 2109"},{"path":"/articles/doubletrouble_vignette.html","id":"classifying-genes-into-unique-modes-of-duplication","dir":"Articles","previous_headings":"","what":"Classifying genes into unique modes of duplication","title":"Identification and classification of duplicated genes","text":"look carefully output classify_gene_pairs(), notice genes appear one duplicate pair, pairs can different duplication modes assigned. ’s nothing wrong . Consider, example, gene originated segmental duplication 60 million years ago, underwent tandem duplication 5 million years ago. output classify_gene_pairs(), ’d see gene two pairs, one SD type column, one TD. want assign gene unique mode duplication, can use function classify_genes(). function assigns duplication modes hierarchically using factor levels column type priority order. priority orders classification scheme : Binary: SD > SSD. Standard: SD > TD > PD > DD. Extended: SD > TD > PD > TRD > DD. Full: SD > TD > PD > rTRD > dTRD > DD. 
input classify_genes() list gene pairs returned classify_gene_pairs().","code":"# Classify genes into unique modes of duplication c_genes <- classify_genes(c_full)  # Inspecting the output names(c_genes) #> [1] \"Scerevisiae\" head(c_genes$Scerevisiae) #>          gene type #> 1 Sce_YGR032W   SD #> 2 Sce_YOR396W   SD #> 3 Sce_YJL225C   SD #> 4 Sce_YNR031C   SD #> 5 Sce_YOR326W   SD #> 6 Sce_YJL222W   SD  # Number of genes per mode table(c_genes$Scerevisiae$type) #>  #>   SD   TD   PD rTRD dTRD   DD  #>  683   67   70   71  883  836"},{"path":"/articles/doubletrouble_vignette.html","id":"calculating-substitution-rates-for-duplicated-gene-pairs","dir":"Articles","previous_headings":"","what":"Calculating substitution rates for duplicated gene pairs","title":"Identification and classification of duplicated genes","text":"can use function pairs2kaks() calculate rates nonsynonymous substitutions per nonsynonymous site (KaK_a), synonymouys substitutions per synonymous site (KsK_s), ratios (Ka/KsK_a/K_s). rates calculated using Bioconductor package MSA2dist, implements codon models KaKs_Calculator 2.0 (Wang et al. 2010). purpose demonstration, calculate KaK_a, KsK_s, Ka/KsK_a/K_s 5 TD-derived gene pairs. CDS TD-derived genes obtained Ensembl Fungi (Yates et al. 2022), stored cds_scerevisiae. Importantly, pairs2kaks() expects genes gene pairs present CDS, matching names. 
Species abbreviations gene pairs (added syntenet) automatically removed, add sequence names CDS.","code":"data(cds_scerevisiae) head(cds_scerevisiae) #> DNAStringSet object of length 6: #>     width seq                                               names                #> [1]  3486 ATGGTTAATATAAGCATCGTAGC...TTGTCGCTTTATTACTGCTATAG YJR151C #> [2]  3276 ATGGGCGAAGGAACTACTAAGGA...TTAATATTGGTATTAAACAATGA YDR040C #> [3]  3276 ATGAGCGAGGGAACTGTCAAAGA...TTAATATCAGTGTCAAGCATTAA YDR038C #> [4]  3276 ATGAGCGAGGGAACTGTCAAAGA...TTAATATTGGTATTAAACAATGA YDR039C #> [5]  2925 ATGAACAGTATGGCCGATACCGA...CCATTACAACATTTCAAACATAA YAR019C #> [6]  2646 ATGCTGGAGTTTCCAATATCAGT...TAGCTGTTCTGTTCGCCTTCTAG YJL078C  # Store DNAStringSet object in a list cds_list <- list(Scerevisiae = cds_scerevisiae)  # Keep only top five TD-derived gene pairs for demonstration purposes td_pairs <- c_full$Scerevisiae[c_full$Scerevisiae$type == \"TD\", ] gene_pairs <- list(Scerevisiae = td_pairs[seq(1, 5, by = 1), ])  # Calculate Ka, Ks, and Ka/Ks kaks <- pairs2kaks(gene_pairs, cds_list)  # Inspect the output head(kaks) #> $Scerevisiae #>    dup1  dup2       Ka       Ks    Ka_Ks type #> 1 Q0055 Q0060      NaN      NaN      NaN   TD #> 2 Q0065 Q0060 0.799925 3.549370 0.225371   TD #> 3 Q0070 Q0045 0.296216 0.438575 0.675405   TD #> 4 Q0070 Q0065 0.394617 0.582050 0.677977   TD #> 5 Q0055 Q0050 0.629343 4.257430 0.147822   TD"},{"path":"/articles/doubletrouble_vignette.html","id":"identifying-and-visualizing-k_s-peaks","dir":"Articles","previous_headings":"","what":"Identifying and visualizing KsK_s peaks","title":"Identification and classification of duplicated genes","text":"Peaks KsK_s distributions typically indicate whole-genome duplication (WGD) events, can identified fitting Gaussian mixture models (GMMs) KsK_s distributions. doubletrouble, can performed function find_ks_peaks(). 
However, saturation higher KsK_s values, recent WGD events can reliably identified KsK_s distributions (Vanneste, Van de Peer, Maere 2013). Recent WGD events commonly found plant species, maize, soybean, apple, etc. Although genomes yeast species signatures WGD, events ancient, hard find evidence using KsK_s distributions. 3 demonstrate can find peaks KsK_s distributions find_ks_peaks(), use data frame containing KsK_s values duplicate pairs soybean (Glycine max) genome, undergone 2 WGDs events ~13 ~58 million years ago (Schmutz et al. 2010). , visualize KsK_s distributions peaks using function plot_ks_peaks(). First , let’s look data quick look distribution function plot_ks_distro() (details function data visualization section).  visual inspection, can see 2 3 peaks. Based prior knowledge, know 2 WGD events occurred ancestral Glycine genus ancestral Fabaceae, seem correspond peaks see KsK_s values around 0.1 0.5, respectively. third, flattened peak around 1.6, represent WGD shared eudicots. Let’s test number peaks support: 2 3.  can see, presence 3 peaks supported (lowest BIC). function returns list mean, variance amplitude mixture components (.e., peaks), well KsK_s distribution . Now, suppose just want get first 2 peaks. can explictly saying find_ks_peaks() many peaks .  Important consideration GMMs KsK_s distributions: Peaks identified GMMs blindly regarded “truth”. Using GMMs find peaks KsK_s distributions can lead problems overfitting overclustering (Tiley, Barker, Burleigh 2018). general recommendations : Use prior knowledge. know many peaks (e.g., based literature evidence), just tell number find_ks_peaks(). Likewise, sure many peaks , know maximum number peaks N, don’t test presence >N peaks. GMMs can incorrectly identify peaks actual number. Test significance peak SiZer (Significant ZERo crossings derivatives) maps (Chaudhuri Marron 1999). can done function SiZer() R package feature. 
example SiZer map, let’s use feature::SiZer() assess significance 2 peaks found previously.  blue regions SiZer map indicate significantly increasing regions curve, support 2 peaks found.","code":"# Load data and inspect it data(gmax_ks) head(gmax_ks) #>              dup1            dup2     Ks type #> 1 GLYMA_07G035600 GLYMA_16G004800 0.1670   SD #> 2 GLYMA_18G275200 GLYMA_08G252600 0.1070   SD #> 3 GLYMA_09G282200 GLYMA_20G003400 0.0822   SD #> 4 GLYMA_01G166400 GLYMA_11G077000 0.0904   SD #> 5 GLYMA_07G252100 GLYMA_17G022300 0.1400   SD #> 6 GLYMA_05G133100 GLYMA_08G087600 0.0883   SD  # Plot distribution plot_ks_distro(gmax_ks) # Find 2 and 3 peaks and test which one has more support peaks <- find_ks_peaks(gmax_ks$Ks, npeaks = c(2, 3), verbose = TRUE) #> Optimal number of peaks: 3 #> Bayesian Information Criterion (BIC):  #>            E         V #> 2 -100166.88 -88545.37 #> 3  -90965.45 -75323.66 #>  #> Top 3 models based on the BIC criterion:  #>       V,3       V,2       E,3  #> -75323.66 -88545.37 -90965.45 names(peaks) #> [1] \"mean\"   \"sd\"     \"lambda\" \"ks\" str(peaks) #> List of 4 #>  $ mean  : Named num [1:3] 0.123 0.601 1.596 #>   ..- attr(*, \"names\")= chr [1:3] \"1\" \"2\" \"3\" #>  $ sd    : num [1:3] 0.0572 0.287 0.2503 #>  $ lambda: num [1:3] 0.285 0.44 0.276 #>  $ ks    : num [1:68085] 0.167 0.107 0.0822 0.0904 0.14 0.0883 0.107 0.756 0.737 0.0872 ...  
# Visualize Ks distribution plot_ks_peaks(peaks) # Find 2 peaks ignoring Ks values > 1 peaks <- find_ks_peaks(gmax_ks$Ks, npeaks = 2, max_ks = 1) plot_ks_peaks(peaks) # Get numeric vector of Ks values <= 1 ks <- gmax_ks$Ks[gmax_ks$Ks <= 1]  # Get SiZer map feature::SiZer(ks) #> Warning: no DISPLAY variable so Tk is not available"},{"path":"/articles/doubletrouble_vignette.html","id":"classifying-genes-by-age-groups","dir":"Articles","previous_headings":"","what":"Classifying genes by age groups","title":"Identification and classification of duplicated genes","text":"Finally, can use peaks obtained classify gene pairs age group. Age groups defined based KsK_s peak pairs belong. useful want analyze duplicate pairs specific WGD event, instance. can function split_pairs_by_peak(). function returns list containing classified pairs data frame, ggplot object age boundaries highlighted histogram KsK_s values.  Age groups can also used identify SD gene pairs likely originated whole-genome duplications. rationale segmental duplicates KsK_s values near KsK_s peaks (indicating WGD events) likely created WGDs. similar logic, SD pairs KsK_s values distant KsK_s peaks (e.g., >2 standard deviations away mean) likely created duplications large genomic segments, duplications entire genome. 
example, find gene pairs soybean genome likely originated WGD event shared legumes (~58 million years ago), ’d need extract SD pairs age group 2 using following code:","code":"# Gene pairs without age-based classification head(gmax_ks) #>              dup1            dup2     Ks type #> 1 GLYMA_07G035600 GLYMA_16G004800 0.1670   SD #> 2 GLYMA_18G275200 GLYMA_08G252600 0.1070   SD #> 3 GLYMA_09G282200 GLYMA_20G003400 0.0822   SD #> 4 GLYMA_01G166400 GLYMA_11G077000 0.0904   SD #> 5 GLYMA_07G252100 GLYMA_17G022300 0.1400   SD #> 6 GLYMA_05G133100 GLYMA_08G087600 0.0883   SD  # Classify gene pairs by age group pairs_age_group <- split_pairs_by_peak(gmax_ks[, c(1,2,3)], peaks)  # Inspecting the output names(pairs_age_group) #> [1] \"pairs\" \"plot\"  # Take a look at the classified gene pairs head(pairs_age_group$pairs) #>              dup1            dup2     ks peak #> 1 GLYMA_07G035600 GLYMA_16G004800 0.1670    1 #> 2 GLYMA_18G275200 GLYMA_08G252600 0.1070    1 #> 3 GLYMA_09G282200 GLYMA_20G003400 0.0822    1 #> 4 GLYMA_01G166400 GLYMA_11G077000 0.0904    1 #> 5 GLYMA_07G252100 GLYMA_17G022300 0.1400    1 #> 6 GLYMA_05G133100 GLYMA_08G087600 0.0883    1  # Visualize Ks distro with age boundaries pairs_age_group$plot # Get all pairs in age group 2 pairs_ag2 <- pairs_age_group$pairs[pairs_age_group$pairs$peak == 2, c(1,2)]  # Get all SD pairs sd_pairs <- gmax_ks[gmax_ks$type == \"SD\", c(1,2)]  # Merge tables pairs_wgd_legumes <- merge(pairs_ag2, sd_pairs)  head(pairs_wgd_legumes) #>              dup1            dup2 #> 1 GLYMA_01G001800 GLYMA_07G130700 #> 2 GLYMA_01G002100 GLYMA_05G221300 #> 3 GLYMA_01G002300 GLYMA_07G130100 #> 4 GLYMA_01G002600 GLYMA_07G129700 #> 5 GLYMA_01G003500 GLYMA_05G222800 #> 6 GLYMA_01G003500 GLYMA_08G029700"},{"path":"/articles/doubletrouble_vignette.html","id":"data-visualization","dir":"Articles","previous_headings":"","what":"Data visualization","title":"Identification and classification of duplicated genes","text":"Last least, 
doubletrouble provides users graphical functions produce publication-ready plots output classify_gene_pairs(), classify_genes(), pairs2kaks(). Let’s take look one one.","code":""},{"path":"/articles/doubletrouble_vignette.html","id":"visualizing-the-frequency-of-duplicates-per-mode","dir":"Articles","previous_headings":"Data visualization","what":"Visualizing the frequency of duplicates per mode","title":"Identification and classification of duplicated genes","text":"visualize frequency duplicated gene pairs genes duplication type (returned classify_gene_pairs() classify_genes(), respectively), first need create data frame counts duplicates2counts(). demonstrate works, use example data set duplicate pairs 3 fungi species (substitution rates, ignored duplicates2counts()). Now, let’s visualize frequency duplicate gene pairs duplication type function plot_duplicate_freqs(). can visualize frequencies three different ways, demonstrated .  want visually frequency duplicated genes (gene pairs), ’d first need classify genes unique modes duplication classify_genes(), repeat code . 
example:","code":"# Load data set with pre-computed duplicates for 3 fungi species data(fungi_kaks) names(fungi_kaks) #> [1] \"saccharomyces_cerevisiae\"  \"candida_glabrata\"          #> [3] \"schizosaccharomyces_pombe\" head(fungi_kaks$saccharomyces_cerevisiae) #>      dup1    dup2       Ka       Ks  Ka_Ks type #> 1 YGR032W YLR342W 0.058800 5.240000 0.0112   SD #> 2 YOR396W YPL283C 0.004010 0.009920 0.4040   SD #> 3 YJL225C YIL177C 0.000253 0.000758 0.3340   SD #> 4 YNR031C YCR073C 0.364000 5.070000 0.0718   SD #> 5 YOR326W YAL029C 0.396000 5.150000 0.0769   SD #> 6 YJL222W YIL173W 0.000276       NA     NA   SD  # Get a data frame of counts per mode in all species counts_table <- duplicates2counts(fungi_kaks |> classify_genes())  counts_table #>    type    n                   species #> 1    SD  683  saccharomyces_cerevisiae #> 2    TD   67  saccharomyces_cerevisiae #> 3    PD   70  saccharomyces_cerevisiae #> 4  rTRD    0  saccharomyces_cerevisiae #> 5  dTRD    0  saccharomyces_cerevisiae #> 6    DD 1790  saccharomyces_cerevisiae #> 7    SD   14          candida_glabrata #> 8    TD  104          candida_glabrata #> 9    PD   42          candida_glabrata #> 10 rTRD    0          candida_glabrata #> 11 dTRD    0          candida_glabrata #> 12   DD 1907          candida_glabrata #> 13   SD   53 schizosaccharomyces_pombe #> 14   TD   38 schizosaccharomyces_pombe #> 15   PD   48 schizosaccharomyces_pombe #> 16 rTRD    0 schizosaccharomyces_pombe #> 17 dTRD    0 schizosaccharomyces_pombe #> 18   DD 1853 schizosaccharomyces_pombe # A) Facets p1 <- plot_duplicate_freqs(counts_table)  # B) Stacked barplot, absolute frequencies p2 <- plot_duplicate_freqs(counts_table, plot_type = \"stack\")  # C) Stacked barplot, relative frequencies p3 <- plot_duplicate_freqs(counts_table, plot_type = \"stack_percent\")  # Combine plots, one per row patchwork::wrap_plots(p1, p2, p3, nrow = 3) +      patchwork::plot_annotation(tag_levels = \"A\") # Frequency of duplicated genes by mode 
classify_genes(fungi_kaks) |>   # classify genes into unique duplication types     duplicates2counts() |>      # get a data frame of counts (long format)     plot_duplicate_freqs()      # plot frequencies"},{"path":"/articles/doubletrouble_vignette.html","id":"visualizing-k_s-distributions","dir":"Articles","previous_headings":"Data visualization","what":"Visualizing KsK_s distributions","title":"Identification and classification of duplicated genes","text":"briefly demonstrated , plot KsK_s distribution whole paranome, use function plot_ks_distro().  However, visualizing distribution whole paranome can mask patterns happen duplicates originating particular duplication types. instance, looking evidence WGD events, visualizing KsK_s distribution SD-derived pairs can reveal whether syntenic genes cluster together, suggesting presence WGD history. visualize distribution duplication type, use bytype = TRUE plot_ks_distro().","code":"ks_df <- fungi_kaks$saccharomyces_cerevisiae  # A) Histogram, whole paranome p1 <- plot_ks_distro(ks_df, plot_type = \"histogram\")  # B) Density, whole paranome p2 <- plot_ks_distro(ks_df, plot_type = \"density\")   # C) Histogram with density lines, whole paranome p3 <- plot_ks_distro(ks_df, plot_type = \"density_histogram\")  # Combine plots side by side patchwork::wrap_plots(p1, p2, p3, nrow = 1) +     patchwork::plot_annotation(tag_levels = \"A\") # A) Duplicates by type, histogram p1 <- plot_ks_distro(ks_df, bytype = TRUE, plot_type = \"histogram\")  # B) Duplicates by type, violin p2 <- plot_ks_distro(ks_df, bytype = TRUE, plot_type = \"violin\")  # Combine plots side by side patchwork::wrap_plots(p1, p2) +     patchwork::plot_annotation(tag_levels = \"A\")"},{"path":"/articles/doubletrouble_vignette.html","id":"visualizing-substitution-rates-by-species","dir":"Articles","previous_headings":"Data visualization","what":"Visualizing substitution rates by species","title":"Identification and classification of duplicated 
genes","text":"function plot_rates_by_species() can used show distributions substitution rates (KsK_s, KaK_a, ratio Ka/KsK_a/K_s) species. can choose rate want visualize, whether group gene pairs duplication mode, demonstrated .","code":"# A) Ks for each species p1 <- plot_rates_by_species(fungi_kaks)  # B) Ka/Ks by duplication type for each species p2 <- plot_rates_by_species(fungi_kaks, rate_column = \"Ka_Ks\", bytype = TRUE)  # Combine plots - one per row patchwork::wrap_plots(p1, p2, nrow = 2) +     patchwork::plot_annotation(tag_levels = \"A\")"},{"path":"/articles/doubletrouble_vignette.html","id":"session-information","dir":"Articles","previous_headings":"","what":"Session information","title":"Identification and classification of duplicated genes","text":"document created following conditions:","code":"sessioninfo::session_info() #> ─ Session info ─────────────────────────────────────────────────────────────── #>  setting  value #>  version  R version 4.4.1 (2024-06-14) #>  os       Ubuntu 22.04.5 LTS #>  system   x86_64, linux-gnu #>  ui       X11 #>  language en #>  collate  en_US.UTF-8 #>  ctype    en_US.UTF-8 #>  tz       UTC #>  date     2024-10-02 #>  pandoc   3.4 @ /usr/bin/ (via rmarkdown) #>  #> ─ Packages ─────────────────────────────────────────────────────────────────── #>  package              * version   date (UTC) lib source #>  abind                  1.4-8     2024-09-12 [1] RSPM (R 4.4.0) #>  ade4                   1.7-22    2023-02-06 [1] RSPM (R 4.4.0) #>  AnnotationDbi        * 1.67.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  ape                    5.8       2024-04-11 [1] RSPM (R 4.4.0) #>  Biobase              * 2.65.1    2024-08-28 [1] Bioconductor 3.20 (R 4.4.1) #>  BiocFileCache          2.13.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  BiocGenerics         * 0.51.2    2024-09-27 [1] Bioconductor 3.20 (R 4.4.1) #>  BiocIO                 1.15.2    2024-08-23 [1] Bioconductor 3.20 (R 4.4.1) #>  BiocManager            
1.30.25   2024-08-28 [2] CRAN (R 4.4.1) #>  BiocParallel           1.39.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  BiocStyle            * 2.33.1    2024-06-12 [1] Bioconductor 3.20 (R 4.4.0) #>  biomaRt                2.61.3    2024-08-06 [1] Bioconductor 3.20 (R 4.4.1) #>  Biostrings             2.73.2    2024-09-26 [1] Bioconductor 3.20 (R 4.4.1) #>  bit                    4.5.0     2024-09-20 [1] RSPM (R 4.4.0) #>  bit64                  4.5.2     2024-09-22 [1] RSPM (R 4.4.0) #>  bitops                 1.0-8     2024-07-29 [1] RSPM (R 4.4.0) #>  blob                   1.2.4     2023-03-17 [1] RSPM (R 4.4.0) #>  bookdown               0.40      2024-07-02 [1] RSPM (R 4.4.0) #>  bslib                  0.8.0     2024-07-29 [2] RSPM (R 4.4.0) #>  cachem                 1.1.0     2024-05-16 [2] RSPM (R 4.4.0) #>  cli                    3.6.3     2024-06-21 [2] RSPM (R 4.4.0) #>  coda                   0.19-4.1  2024-01-31 [1] RSPM (R 4.4.0) #>  codetools              0.2-20    2024-03-31 [3] CRAN (R 4.4.1) #>  colorspace             2.1-1     2024-07-26 [1] RSPM (R 4.4.0) #>  crayon                 1.5.3     2024-06-20 [2] RSPM (R 4.4.0) #>  curl                   5.2.3     2024-09-20 [2] RSPM (R 4.4.0) #>  DBI                    1.2.3     2024-06-02 [1] RSPM (R 4.4.0) #>  dbplyr                 2.5.0     2024-03-19 [1] RSPM (R 4.4.0) #>  DelayedArray           0.31.12   2024-09-27 [1] Bioconductor 3.20 (R 4.4.1) #>  desc                   1.4.3     2023-12-10 [2] RSPM (R 4.4.0) #>  digest                 0.6.37    2024-08-19 [2] RSPM (R 4.4.0) #>  doParallel             1.0.17    2022-02-07 [1] RSPM (R 4.4.0) #>  doubletrouble        * 1.5.2     2024-10-02 [1] Bioconductor #>  dplyr                  1.1.4     2023-11-17 [1] RSPM (R 4.4.0) #>  evaluate               1.0.0     2024-09-17 [2] RSPM (R 4.4.0) #>  fansi                  1.0.6     2023-12-08 [2] RSPM (R 4.4.0) #>  farver                 2.1.2     2024-05-13 [1] RSPM (R 4.4.0) #>  fastmap          
      1.2.0     2024-05-15 [2] RSPM (R 4.4.0) #>  feature                1.2.15    2021-02-10 [1] RSPM (R 4.4.0) #>  filelock               1.0.3     2023-12-11 [1] RSPM (R 4.4.0) #>  foreach                1.5.2     2022-02-02 [1] RSPM (R 4.4.0) #>  fs                     1.6.4     2024-04-25 [2] RSPM (R 4.4.0) #>  generics               0.1.3     2022-07-05 [1] RSPM (R 4.4.0) #>  GenomeInfoDb         * 1.41.1    2024-05-24 [1] Bioconductor 3.20 (R 4.4.0) #>  GenomeInfoDbData       1.2.13    2024-10-02 [1] Bioconductor #>  GenomicAlignments      1.41.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  GenomicFeatures      * 1.57.1    2024-09-27 [1] Bioconductor 3.20 (R 4.4.1) #>  GenomicRanges        * 1.57.1    2024-06-12 [1] Bioconductor 3.20 (R 4.4.0) #>  ggnetwork              0.5.13    2024-02-14 [1] RSPM (R 4.4.0) #>  ggplot2                3.5.1     2024-04-23 [1] RSPM (R 4.4.0) #>  glue                   1.8.0     2024-09-30 [2] RSPM (R 4.4.0) #>  gtable                 0.3.5     2024-04-22 [1] RSPM (R 4.4.0) #>  highr                  0.11      2024-05-26 [2] RSPM (R 4.4.0) #>  hms                    1.1.3     2023-03-21 [1] RSPM (R 4.4.0) #>  htmltools              0.5.8.1   2024-04-04 [2] RSPM (R 4.4.0) #>  htmlwidgets            1.6.4     2023-12-06 [2] RSPM (R 4.4.0) #>  httr                   1.4.7     2023-08-15 [1] RSPM (R 4.4.0) #>  httr2                  1.0.5     2024-09-26 [2] RSPM (R 4.4.0) #>  igraph                 2.0.3     2024-03-13 [1] RSPM (R 4.4.0) #>  intergraph             2.0-4     2024-02-01 [1] RSPM (R 4.4.0) #>  IRanges              * 2.39.2    2024-07-17 [1] Bioconductor 3.20 (R 4.4.1) #>  iterators              1.0.14    2022-02-05 [1] RSPM (R 4.4.0) #>  jquerylib              0.1.4     2021-04-26 [2] RSPM (R 4.4.0) #>  jsonlite               1.8.9     2024-09-20 [2] RSPM (R 4.4.0) #>  KEGGREST               1.45.1    2024-06-17 [1] Bioconductor 3.20 (R 4.4.0) #>  KernSmooth             2.23-24   2024-05-17 [3] CRAN (R 4.4.1) 
#>  knitr                  1.48      2024-07-07 [2] RSPM (R 4.4.0) #>  ks                     1.14.3    2024-09-20 [1] RSPM (R 4.4.0) #>  labeling               0.4.3     2023-08-29 [1] RSPM (R 4.4.0) #>  lattice                0.22-6    2024-03-20 [3] CRAN (R 4.4.1) #>  lifecycle              1.0.4     2023-11-07 [2] RSPM (R 4.4.0) #>  magrittr               2.0.3     2022-03-30 [2] RSPM (R 4.4.0) #>  MASS                   7.3-61    2024-06-13 [2] RSPM (R 4.4.0) #>  Matrix                 1.7-0     2024-04-26 [3] CRAN (R 4.4.1) #>  MatrixGenerics         1.17.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  matrixStats            1.4.1     2024-09-08 [1] RSPM (R 4.4.0) #>  mclust                 6.1.1     2024-04-29 [1] RSPM (R 4.4.0) #>  memoise                2.0.1     2021-11-26 [2] RSPM (R 4.4.0) #>  MSA2dist               1.9.0     2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  munsell                0.5.1     2024-04-01 [1] RSPM (R 4.4.0) #>  mvtnorm                1.3-1     2024-09-03 [1] RSPM (R 4.4.0) #>  network                1.18.2    2023-12-05 [1] RSPM (R 4.4.0) #>  networkD3              0.4       2017-03-18 [1] RSPM (R 4.4.0) #>  nlme                   3.1-166   2024-08-14 [2] RSPM (R 4.4.0) #>  patchwork              1.3.0     2024-09-16 [1] RSPM (R 4.4.0) #>  pheatmap               1.0.12    2019-01-04 [1] RSPM (R 4.4.0) #>  pillar                 1.9.0     2023-03-22 [2] RSPM (R 4.4.0) #>  pkgconfig              2.0.3     2019-09-22 [2] RSPM (R 4.4.0) #>  pkgdown                2.1.1     2024-09-17 [2] RSPM (R 4.4.0) #>  png                    0.1-8     2022-11-29 [1] RSPM (R 4.4.0) #>  pracma                 2.4.4     2023-11-10 [1] RSPM (R 4.4.0) #>  prettyunits            1.2.0     2023-09-24 [2] RSPM (R 4.4.0) #>  progress               1.2.3     2023-12-06 [1] RSPM (R 4.4.0) #>  purrr                  1.0.2     2023-08-10 [2] RSPM (R 4.4.0) #>  pwalign                1.1.0     2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  R6            
         2.5.1     2021-08-19 [2] RSPM (R 4.4.0) #>  ragg                   1.3.3     2024-09-11 [2] RSPM (R 4.4.0) #>  rappdirs               0.3.3     2021-01-31 [2] RSPM (R 4.4.0) #>  RColorBrewer           1.1-3     2022-04-03 [1] RSPM (R 4.4.0) #>  Rcpp                   1.0.13    2024-07-17 [2] RSPM (R 4.4.0) #>  RCurl                  1.98-1.16 2024-07-11 [1] RSPM (R 4.4.0) #>  restfulr               0.0.15    2022-06-16 [1] RSPM (R 4.4.0) #>  rjson                  0.2.23    2024-09-16 [1] RSPM (R 4.4.0) #>  rlang                  1.1.4     2024-06-04 [2] RSPM (R 4.4.0) #>  rmarkdown              2.28      2024-08-17 [2] RSPM (R 4.4.0) #>  Rsamtools              2.21.2    2024-09-26 [1] Bioconductor 3.20 (R 4.4.1) #>  RSQLite                2.3.7     2024-05-27 [1] RSPM (R 4.4.0) #>  rtracklayer            1.65.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  S4Arrays               1.5.10    2024-09-29 [1] Bioconductor 3.20 (R 4.4.1) #>  S4Vectors            * 0.43.2    2024-07-17 [1] Bioconductor 3.20 (R 4.4.1) #>  sass                   0.4.9     2024-03-15 [2] RSPM (R 4.4.0) #>  scales                 1.3.0     2023-11-28 [1] RSPM (R 4.4.0) #>  seqinr                 4.2-36    2023-12-08 [1] RSPM (R 4.4.0) #>  sessioninfo            1.2.2     2021-12-06 [2] RSPM (R 4.4.0) #>  SparseArray            1.5.41    2024-09-27 [1] Bioconductor 3.20 (R 4.4.1) #>  statnet.common         4.9.0     2023-05-24 [1] RSPM (R 4.4.0) #>  stringi                1.8.4     2024-05-06 [2] RSPM (R 4.4.0) #>  stringr                1.5.1     2023-11-14 [2] RSPM (R 4.4.0) #>  SummarizedExperiment   1.35.2    2024-09-27 [1] Bioconductor 3.20 (R 4.4.1) #>  syntenet             * 1.7.0     2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  systemfonts            1.1.0     2024-05-15 [2] RSPM (R 4.4.0) #>  textshaping            0.4.0     2024-05-24 [2] RSPM (R 4.4.0) #>  tibble                 3.2.1     2023-03-20 [2] RSPM (R 4.4.0) #>  tidyr                  1.3.1     2024-01-24 
[1] RSPM (R 4.4.0) #>  tidyselect             1.2.1     2024-03-11 [1] RSPM (R 4.4.0) #>  txdbmaker            * 1.1.1     2024-06-20 [1] Bioconductor 3.20 (R 4.4.0) #>  UCSC.utils             1.1.0     2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  utf8                   1.2.4     2023-10-22 [2] RSPM (R 4.4.0) #>  vctrs                  0.6.5     2023-12-01 [2] RSPM (R 4.4.0) #>  withr                  3.0.1     2024-07-31 [2] RSPM (R 4.4.0) #>  xfun                   0.47      2024-08-17 [2] RSPM (R 4.4.0) #>  XML                    3.99-0.17 2024-06-25 [1] RSPM (R 4.4.0) #>  xml2                   1.3.6     2023-12-04 [2] RSPM (R 4.4.0) #>  XVector                0.45.0    2024-05-01 [1] Bioconductor 3.20 (R 4.4.0) #>  yaml                   2.3.10    2024-07-26 [2] RSPM (R 4.4.0) #>  zlibbioc               1.51.1    2024-06-05 [1] Bioconductor 3.20 (R 4.4.0) #>  #>  [1] /__w/_temp/Library #>  [2] /usr/local/lib/R/site-library #>  [3] /usr/local/lib/R/library #>  #> ──────────────────────────────────────────────────────────────────────────────"},{"path":[]},{"path":"/authors.html","id":null,"dir":"","previous_headings":"","what":"Authors","title":"Authors and Citation","text":"Fabrício Almeida-Silva. Author, maintainer. Yves Van de Peer. Author.","code":""},{"path":"/authors.html","id":"citation","dir":"","previous_headings":"","what":"Citation","title":"Authors and Citation","text":"Almeida-Silva F, Van de Peer Y (2024). doubletrouble: Identification classification duplicated genes. 
R package version 1.5.2, https://github.com/almeidasilvaf/doubletrouble.","code":"@Manual{,   title = {doubletrouble: Identification and classification of duplicated genes},   author = {Fabrício Almeida-Silva and Yves {Van de Peer}},   year = {2024},   note = {R package version 1.5.2},   url = {https://github.com/almeidasilvaf/doubletrouble}, }"},{"path":"/index.html","id":"doubletrouble-","dir":"","previous_headings":"","what":"Identification and classification of duplicated genes","title":"Identification and classification of duplicated genes","text":"major goal doubletrouble identify duplicated genes whole-genome protein sequences classify based modes duplication. Duplicates can classified using four different classification schemes, increase complexity level details stepwise manner. classification schemes duplication modes can classify : Legend: SD, segmental duplication. SSD, small-scale duplication. TD, tandem duplication. PD, proximal duplication. TRD, transposon-derived duplication. rTRD, retrotransposon-derived duplication. dTRD, DNA transposon-derived duplication. DD, dispersed duplication. Besides classifying gene pairs, users can also classify genes, gene assigned unique mode duplication. Users can also calculate substitution rates per substitution site (.e., KaK_a, KsK_s ratios KaKs\\frac{K_a}{K_s}) duplicate pairs, find peaks Ks distributions Gaussian Mixture Models (GMMs), classify gene pairs age groups based Ks peaks.","code":""},{"path":"/index.html","id":"installation-instructions","dir":"","previous_headings":"","what":"Installation instructions","title":"Identification and classification of duplicated genes","text":"Get latest stable R release CRAN. 
install doubletrouble Bioconductor using following code: development version GitHub :","code":"if (!requireNamespace(\"BiocManager\", quietly = TRUE)) {     install.packages(\"BiocManager\") }  BiocManager::install(\"doubletrouble\") BiocManager::install(\"almeidasilvaf/doubletrouble\")"},{"path":"/index.html","id":"citation","dir":"","previous_headings":"","what":"Citation","title":"Identification and classification of duplicated genes","text":"citation output using citation('doubletrouble') R. Please run check updates cite doubletrouble. Please note doubletrouble made possible thanks many R bioinformatics software authors, cited either vignettes /paper(s) describing package.","code":"print(citation('doubletrouble'), bibtex = TRUE) #> To cite package 'doubletrouble' in publications use: #>  #>   Almeida-Silva F, Van de Peer Y (2022). _doubletrouble: Identification #>   and classification of duplicated genes_. R package version 1.3.0, #>   <https://github.com/almeidasilvaf/doubletrouble>. #>  #> A BibTeX entry for LaTeX users is #>  #>   @Manual{, #>     title = {doubletrouble: Identification and classification of duplicated genes}, #>     author = {Fabrício Almeida-Silva and Yves {Van de Peer}}, #>     year = {2022}, #>     note = {R package version 1.3.0}, #>     url = {https://github.com/almeidasilvaf/doubletrouble}, #>   }"},{"path":"/index.html","id":"code-of-conduct","dir":"","previous_headings":"","what":"Code of Conduct","title":"Identification and classification of duplicated genes","text":"Please note doubletrouble project released Contributor Code Conduct. contributing project, agree abide terms.","code":""},{"path":"/index.html","id":"development-tools","dir":"","previous_headings":"","what":"Development tools","title":"Identification and classification of duplicated genes","text":"Continuous code testing possible thanks GitHub actions usethis, remotes, rcmdcheck customized use Bioconductor’s docker containers BiocCheck. 
Code coverage assessment possible thanks codecov covr. documentation website automatically updated thanks pkgdown. code styled automatically thanks styler. documentation formatted thanks devtools roxygen2. details, check dev directory. package developed using biocthis.","code":""},{"path":"/reference/cds_scerevisiae.html","id":null,"dir":"Reference","previous_headings":"","what":"Coding sequences (CDS) of S. cerevisiae — cds_scerevisiae","title":"Coding sequences (CDS) of S. cerevisiae — cds_scerevisiae","text":"Data obtained Ensembl Fungi, CDS primary transcripts included.","code":""},{"path":"/reference/cds_scerevisiae.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Coding sequences (CDS) of S. cerevisiae — cds_scerevisiae","text":"","code":"data(cds_scerevisiae)"},{"path":"/reference/cds_scerevisiae.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Coding sequences (CDS) of S. cerevisiae — cds_scerevisiae","text":"DNAStringSet object CDS S. cerevisiae.","code":""},{"path":"/reference/cds_scerevisiae.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Coding sequences (CDS) of S. 
cerevisiae — cds_scerevisiae","text":"","code":"data(cds_scerevisiae)"},{"path":"/reference/classify_gene_pairs.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"Classify duplicate gene pairs based modes duplication","code":""},{"path":"/reference/classify_gene_pairs.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"","code":"classify_gene_pairs(   annotation = NULL,   blast_list = NULL,   scheme = \"standard\",   blast_inter = NULL,   intron_counts,   evalue = 1e-10,   anchors = 5,   max_gaps = 25,   proximal_max = 10,   collinearity_dir = NULL )"},{"path":"/reference/classify_gene_pairs.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"annotation processed GRangesList CompressedGRangesList object returned syntenet::process_input(). blast_list list data frames containing BLAST tabular output intraspecies comparisons. list element corresponds BLAST output given species, names list elements must match names list elements annotation. BLASTp, DIAMOND simular programs must run processed sequence data returned process_input(). scheme Character indicating classification scheme use. One \"binary\", \"standard\", \"extended\", \"full\". See details information scheme means. Default: \"standard\". blast_inter (valid scheme == \"extended\" \"full\"). list data frames containing BLAST tabular output comparison target species outgroups. Names list elements must match names list elements annotation. BLASTp, DIAMOND simular programs must run processed sequence data returned process_input(). 
intron_counts (valid scheme == \"full\"). list 2-column data frames number introns per gene returned get_intron_counts(). Names list elements must match names annotation. evalue Numeric scalar indicating E-value threshold. Default: 1e-10. anchors Numeric indicating minimum required number genes call syntenic block, syntenet::infer_syntenet. Default: 5. max_gaps Numeric indicating number upstream downstream genes search anchors, syntenet::infer_syntenet. Default: 25. proximal_max Numeric scalar maximum distance (number genes) two genes consider proximal duplicates. Default: 10. collinearity_dir Character indicating path directory .collinearity files stored. NULL, files stored subdirectory tempdir(). Default: NULL.","code":""},{"path":"/reference/classify_gene_pairs.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"list 3-column data frames duplicated gene pairs (columns 1 2), modes duplication (column 3).","code":""},{"path":"/reference/classify_gene_pairs.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"classification schemes increase complexity (number classes) order 'binary', 'standard', 'extended', 'full'. classification scheme \"binary\", duplicates classified one 'SD' (segmental duplications) 'SSD' (small-scale duplications). classification scheme \"standard\" (default), duplicates classified 'SD' (segmental duplication), 'TD' (tandem duplication), 'PD' (proximal duplication), 'DD' (dispersed duplication). classification scheme \"extended\", duplicates classified 'SD' (segmental duplication), 'TD' (tandem duplication), 'PD' (proximal duplication), 'TRD' (transposon-derived duplication), 'DD' (dispersed duplication). 
Finally, classification scheme \"full\", duplicates classified 'SD' (segmental duplication), 'TD' (tandem duplication), 'PD' (proximal duplication), 'rTRD' (retrotransposon-derived duplication), 'dTRD' (DNA transposon-derived duplication), 'DD' (dispersed duplication).","code":""},{"path":"/reference/classify_gene_pairs.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify duplicate gene pairs based on their modes of duplication — classify_gene_pairs","text":"","code":"# Load example data data(diamond_intra) data(diamond_inter) data(yeast_annot) data(yeast_seq)  # Get processed annotation data annotation <- syntenet::process_input(yeast_seq, yeast_annot)$annotation  # Get list of intron counts library(txdbmaker) #> Loading required package: BiocGenerics #>  #> Attaching package: ‘BiocGenerics’ #> The following objects are masked from ‘package:stats’: #>  #>     IQR, mad, sd, var, xtabs #> The following objects are masked from ‘package:base’: #>  #>     Filter, Find, Map, Position, Reduce, anyDuplicated, aperm, append, #>     as.data.frame, basename, cbind, colnames, dirname, do.call, #>     duplicated, eval, evalq, get, grep, grepl, intersect, is.unsorted, #>     lapply, mapply, match, mget, order, paste, pmax, pmax.int, pmin, #>     pmin.int, rank, rbind, rownames, sapply, saveRDS, setdiff, table, #>     tapply, union, unique, unsplit, which.max, which.min #> Loading required package: S4Vectors #> Loading required package: stats4 #>  #> Attaching package: ‘S4Vectors’ #> The following object is masked from ‘package:utils’: #>  #>     findMatches #> The following objects are masked from ‘package:base’: #>  #>     I, expand.grid, unname #> Loading required package: GenomeInfoDb #> Loading required package: IRanges #> Loading required package: GenomicRanges #> Loading required package: GenomicFeatures #> Loading required package: AnnotationDbi #> Loading required package: Biobase #> Welcome to Bioconductor #>  #>     
Vignettes contain introductory material; view with #>     'browseVignettes()'. To cite Bioconductor, see #>     'citation(\"Biobase\")', and for packages 'citation(\"pkgname\")'. #>  #> Attaching package: ‘txdbmaker’ #> The following objects are masked from ‘package:GenomicFeatures’: #>  #>     UCSCFeatureDbTableSchema, browseUCSCtrack, getChromInfoFromBiomart, #>     makeFDbPackageFromUCSC, makeFeatureDbFromUCSC, makePackageName, #>     makeTxDb, makeTxDbFromBiomart, makeTxDbFromEnsembl, #>     makeTxDbFromGFF, makeTxDbFromGRanges, makeTxDbFromUCSC, #>     makeTxDbPackage, makeTxDbPackageFromBiomart, #>     makeTxDbPackageFromUCSC, supportedMiRBaseBuildValues, #>     supportedUCSCFeatureDbTables, supportedUCSCFeatureDbTracks, #>     supportedUCSCtables txdb_list <- lapply(yeast_annot, txdbmaker::makeTxDbFromGRanges) intron_counts <- lapply(txdb_list, get_intron_counts)  # Classify duplicates - full scheme dup_class <- classify_gene_pairs(     annotation = annotation,      blast_list = diamond_intra,      scheme = \"full\",     blast_inter = diamond_inter,      intron_counts = intron_counts )  # Check number of gene pairs per class table(dup_class$Scerevisiae$type) #>  #>   SD   TD   PD rTRD dTRD   DD  #>  342   42   80   52  963 2109"},{"path":"/reference/classify_genes.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify genes into unique modes of duplication — classify_genes","title":"Classify genes into unique modes of duplication — classify_genes","text":"Classify genes unique modes duplication","code":""},{"path":"/reference/classify_genes.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify genes into unique modes of duplication — classify_genes","text":"","code":"classify_genes(gene_pairs_list = NULL)"},{"path":"/reference/classify_genes.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify genes into unique modes of duplication — 
classify_genes","text":"gene_pairs_list List classified gene pairs returned classify_gene_pairs().","code":""},{"path":"/reference/classify_genes.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify genes into unique modes of duplication — classify_genes","text":"list 2-column data frames variables gene type representing gene ID duplication type, respectively.","code":""},{"path":"/reference/classify_genes.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Classify genes into unique modes of duplication — classify_genes","text":"gene present pairs different duplication modes, gene classified unique mode duplication following order priority indicated levels factor type. scheme \"binary\", order SD > SSD. scheme \"standard\", order SD > TD > PD > DD. scheme \"extended\", order SD > TD > PD > TRD > DD. scheme \"full\", order SD > TD > PD > rTRD > dTRD > DD.","code":""},{"path":"/reference/classify_genes.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify genes into unique modes of duplication — classify_genes","text":"","code":"data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae  cols <- c(\"dup1\", \"dup2\", \"type\") gene_pairs_list <- list(Scerevisiae = scerevisiae_kaks[, cols])  class_genes <- classify_genes(gene_pairs_list)"},{"path":"/reference/diamond_inter.html","id":null,"dir":"Reference","previous_headings":"","what":"Interspecies DIAMOND output for yeast species — diamond_inter","title":"Interspecies DIAMOND output for yeast species — diamond_inter","text":"list contains similarity search S. cerevisiae C. 
glabrata, obtained run_diamond().","code":""},{"path":"/reference/diamond_inter.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Interspecies DIAMOND output for yeast species — diamond_inter","text":"","code":"data(diamond_inter)"},{"path":"/reference/diamond_inter.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Interspecies DIAMOND output for yeast species — diamond_inter","text":"list data frames (length 1) containing output DIAMOND search S. cerevisiae C. glabrata (outgroup).","code":""},{"path":"/reference/diamond_inter.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Interspecies DIAMOND output for yeast species — diamond_inter","text":"","code":"data(diamond_inter)"},{"path":"/reference/diamond_intra.html","id":null,"dir":"Reference","previous_headings":"","what":"Intraspecies DIAMOND output for S. cerevisiae — diamond_intra","title":"Intraspecies DIAMOND output for S. cerevisiae — diamond_intra","text":"List obtained run_diamond().","code":""},{"path":"/reference/diamond_intra.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Intraspecies DIAMOND output for S. cerevisiae — diamond_intra","text":"","code":"data(diamond_intra)"},{"path":"/reference/diamond_intra.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Intraspecies DIAMOND output for S. cerevisiae — diamond_intra","text":"list data frames (length 1) containing whole paranome S. cerevisiae resulting intragenome similarity searches.","code":""},{"path":"/reference/diamond_intra.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Intraspecies DIAMOND output for S. 
cerevisiae — diamond_intra","text":"","code":"data(diamond_intra)"},{"path":"/reference/duplicates2counts.html","id":null,"dir":"Reference","previous_headings":"","what":"Get a duplicate count matrix for each genome — duplicates2counts","title":"Get a duplicate count matrix for each genome — duplicates2counts","text":"Get duplicate count matrix genome","code":""},{"path":"/reference/duplicates2counts.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Get a duplicate count matrix for each genome — duplicates2counts","text":"","code":"duplicates2counts(duplicate_list, shape = \"long\")"},{"path":"/reference/duplicates2counts.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Get a duplicate count matrix for each genome — duplicates2counts","text":"duplicate_list list data frames duplicated genes gene pairs modes duplication returned classify_gene_pairs() classify_genes(). shape Character specifying shape output data frame. One \"long\" (data frame long shape, tidyverse sense), \"wide\" (data frame wide shape, tidyverse sense). Default: \"long\".","code":""},{"path":"/reference/duplicates2counts.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Get a duplicate count matrix for each genome — duplicates2counts","text":"shape = \"wide\", count matrix containing frequency duplicated genes (gene pairs) mode species, species rows duplication modes columns. shape = \"long\", data frame long format following variables: type Factor, type duplication. n Numeric, number duplicates. 
species Character, species name","code":""},{"path":"/reference/duplicates2counts.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Get a duplicate count matrix for each genome — duplicates2counts","text":"","code":"data(fungi_kaks)  # Get unique duplicates duplicate_list <- classify_genes(fungi_kaks)  # Get count table counts <- duplicates2counts(duplicate_list)"},{"path":"/reference/find_ks_peaks.html","id":null,"dir":"Reference","previous_headings":"","what":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","title":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","text":"Find peaks Ks distribution Gaussian Mixture Models","code":""},{"path":"/reference/find_ks_peaks.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","text":"","code":"find_ks_peaks(ks, npeaks = 2, min_ks = 0.01, max_ks = 4, verbose = FALSE)"},{"path":"/reference/find_ks_peaks.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","text":"ks numeric vector Ks values. npeaks Numeric scalar indicating number peaks Ks distribution. know many peaks , can include range values, number peaks produces lowest BIC (Bayesian Information Criterion) selected optimal. Default: 2. min_ks Numeric scalar minimum Ks value. Removing small Ks values generally used avoid incorporation allelic /splice variants prevent fitting component infinity. Default: 0.01. max_ks Numeric scalar indicating maximum Ks value. Removing large Ks values usually performed account Ks saturation. Default: 4. verbose Logical indicating messages printed screen. 
Default: FALSE.","code":""},{"path":"/reference/find_ks_peaks.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","text":"list following elements: mean Numeric estimated means. sd Numeric estimated standard deviations. lambda Numeric estimated mixture weights. ks Numeric vector filtered Ks distribution based arguments passed min_ks max_ks.","code":""},{"path":"/reference/find_ks_peaks.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Find peaks in a Ks distribution with Gaussian Mixture Models — find_ks_peaks","text":"","code":"data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae ks <- scerevisiae_kaks$Ks  # Find 2 peaks in Ks distribution peaks <- find_ks_peaks(ks, npeaks = 2)  # From 2 to 4 peaks, verbose = TRUE to show BIC values peaks <- find_ks_peaks(ks, npeaks = c(2, 3, 4), verbose = TRUE) #> Optimal number of peaks: 4 #> Bayesian Information Criterion (BIC):  #>           E         V #> 2 -4833.369 -4312.906 #> 3 -4109.263 -3625.427 #> 4 -4124.051 -3397.111 #>  #> Top 3 models based on the BIC criterion:  #>       V,4       V,3       E,3  #> -3397.111 -3625.427 -4109.263"},{"path":"/reference/fungi_kaks.html","id":null,"dir":"Reference","previous_headings":"","what":"Duplicate pairs and Ka, Ks, and Ka/Ks values for fungi species — fungi_kaks","title":"Duplicate pairs and Ka, Ks, and Ka/Ks values for fungi species — fungi_kaks","text":"data set obtained classify_gene_pairs() followed pairs2kaks().","code":""},{"path":"/reference/fungi_kaks.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Duplicate pairs and Ka, Ks, and Ka/Ks values for fungi species — fungi_kaks","text":"","code":"data(fungi_kaks)"},{"path":"/reference/fungi_kaks.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Duplicate pairs and Ka, Ks, and 
Ka/Ks values for fungi species — fungi_kaks","text":"list data frame elements named saccharomyces_cerevisiae, candida_glabrata, schizosaccharomyces_pombe. data frame contains following variables: dup1 Character, duplicated gene 1. dup2 Character, duplicated gene 2. Ka Numeric, Ka values. Ks Numeric, Ks values. Ka_Ks Numeric, Ka/Ks values. type Character, mode duplication","code":""},{"path":"/reference/fungi_kaks.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Duplicate pairs and Ka, Ks, and Ka/Ks values for fungi species — fungi_kaks","text":"","code":"data(fungi_kaks)"},{"path":"/reference/get_anchors_list.html","id":null,"dir":"Reference","previous_headings":"","what":"Get a list of anchor pairs for each species — get_anchors_list","title":"Get a list of anchor pairs for each species — get_anchors_list","text":"Get list anchor pairs species","code":""},{"path":"/reference/get_anchors_list.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Get a list of anchor pairs for each species — get_anchors_list","text":"","code":"get_anchors_list(   blast_list = NULL,   annotation = NULL,   evalue = 1e-10,   anchors = 5,   max_gaps = 25,   collinearity_dir = NULL )"},{"path":"/reference/get_anchors_list.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Get a list of anchor pairs for each species — get_anchors_list","text":"blast_list list data frames containing BLAST tabular output intraspecies comparisons. list element corresponds BLAST output given species, names list elements must match names list elements annotation. BLASTp, DIAMOND simular programs must run processed sequence data returned process_input(). annotation processed GRangesList CompressedGRangesList object returned syntenet::process_input(). evalue Numeric scalar indicating E-value threshold. Default: 1e-10. 
anchors Numeric indicating minimum required number genes call syntenic block, syntenet::infer_syntenet. Default: 5. max_gaps Numeric indicating number upstream downstream genes search anchors, syntenet::infer_syntenet. Default: 25. collinearity_dir Character indicating path directory .collinearity files stored. NULL, files stored subdirectory tempdir(). Default: NULL.","code":""},{"path":"/reference/get_anchors_list.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Get a list of anchor pairs for each species — get_anchors_list","text":"list data frames representing intraspecies anchor pairs.","code":""},{"path":"/reference/get_anchors_list.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Get a list of anchor pairs for each species — get_anchors_list","text":"","code":"data(diamond_intra) data(yeast_annot) data(yeast_seq) blast_list <- diamond_intra  # Get processed annotation for S. cerevisiae annotation <- syntenet::process_input(yeast_seq, yeast_annot)$annotation  # Get list of intraspecies anchor pairs anchorpairs <- get_anchors_list(blast_list, annotation)"},{"path":"/reference/get_intron_counts.html","id":null,"dir":"Reference","previous_headings":"","what":"Get a data frame of intron counts per gene — get_intron_counts","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"Get data frame intron counts per gene","code":""},{"path":"/reference/get_intron_counts.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"","code":"get_intron_counts(txdb)"},{"path":"/reference/get_intron_counts.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"txdb TxDb object transcript annotations. 
See details examples create TxDb objects different kinds input.","code":""},{"path":"/reference/get_intron_counts.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"data frame intron counts per gene, variables: gene Character gene IDs. introns Numeric number introns per gene.","code":""},{"path":"/reference/get_intron_counts.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"family functions makeTxDbFrom* txdbmaker package can used create TxDb objects variety input data types. can create TxDb objects e.g., GRanges objects (makeTxDbFromGRanges()), GFF files (makeTxDbFromGFF()), Ensembl database (makeTxDbFromEnsembl), Biomart database (makeTxDbFromBiomart).","code":""},{"path":"/reference/get_intron_counts.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Get a data frame of intron counts per gene — get_intron_counts","text":"","code":"data(yeast_annot)  # Create TxDb object from GRanges library(txdbmaker) txdb <- txdbmaker::makeTxDbFromGRanges(yeast_annot[[1]])  # Get intron counts intron_counts <- get_intron_counts(txdb)"},{"path":"/reference/get_segmental.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify gene pairs derived from segmental duplications — get_segmental","title":"Classify gene pairs derived from segmental duplications — get_segmental","text":"Classify gene pairs derived segmental duplications","code":""},{"path":"/reference/get_segmental.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify gene pairs derived from segmental duplications — get_segmental","text":"","code":"get_segmental(anchor_pairs = NULL, pairs = 
NULL)"},{"path":"/reference/get_segmental.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify gene pairs derived from segmental duplications — get_segmental","text":"anchor_pairs 2-column data frame anchor pairs columns 1 2. pairs 2-column data frame duplicate pairs. equivalent first 2 columns tabular output BLAST-like programs.","code":""},{"path":"/reference/get_segmental.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify gene pairs derived from segmental duplications — get_segmental","text":"3-column data frame variables: dup1 Character, duplicated gene 1 dup2 Character, duplicated gene 2 type Factor indicating duplication types, levels \"SD\" (segmental duplication) \"DD\" (dispersed duplication).","code":""},{"path":"/reference/get_segmental.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify gene pairs derived from segmental duplications — get_segmental","text":"","code":"data(diamond_intra) data(yeast_annot) data(yeast_seq) blast_list <- diamond_intra  # Get processed annotation for S. 
cerevisiae annotation <- syntenet::process_input(yeast_seq, yeast_annot)$annotation[1]  # Get list of intraspecies anchor pairs anchor_pairs <- get_anchors_list(blast_list, annotation) anchor_pairs <- anchor_pairs[[1]][, c(1, 2)]  # Get duplicate pairs from DIAMOND output duplicates <- diamond_intra[[1]][, c(1, 2)] dups <- get_segmental(anchor_pairs, duplicates)"},{"path":"/reference/get_tandem_proximal.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","title":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","text":"Classify gene pairs derived tandem proximal duplications","code":""},{"path":"/reference/get_tandem_proximal.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","text":"","code":"get_tandem_proximal(pairs = NULL, annotation_granges = NULL, proximal_max = 10)"},{"path":"/reference/get_tandem_proximal.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","text":"pairs 3-column data frame columns dup1, dup2, type indicating duplicated gene 1, duplicated gene 2, mode duplication associated pair. data frame returned get_segmental(). annotation_granges processed GRanges object element list returned syntenet::process_input(). proximal_max Numeric scalar maximum distance (number genes) two genes consider proximal duplicates. Default: 10.","code":""},{"path":"/reference/get_tandem_proximal.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","text":"3-column data frame variables: dup1 Character, duplicated gene 1. dup2 Character, duplicated gene 2. 
type Factor duplication types, levels \"SD\" (segmental duplication), \"TD\" (tandem duplication), \"PD\" (proximal duplication), \"DD\" (dispersed duplication).","code":""},{"path":"/reference/get_tandem_proximal.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify gene pairs derived from tandem and proximal duplications — get_tandem_proximal","text":"","code":"data(yeast_annot) data(yeast_seq) data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae  # Get processed annotation for S. cerevisiae pdata <- annotation <- syntenet::process_input(yeast_seq, yeast_annot) annot <- pdata$annotation[[1]]  # Get duplicated pairs pairs <- scerevisiae_kaks[, c(\"dup1\", \"dup2\", \"type\")] pairs$dup1 <- paste0(\"Sce_\", pairs$dup1) pairs$dup2 <- paste0(\"Sce_\", pairs$dup2)  # Get tandem and proximal duplicates td_pd_pairs <- get_tandem_proximal(pairs, annot)"},{"path":"/reference/get_transposed.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify gene pairs originating from transposon-derived duplications — get_transposed","title":"Classify gene pairs originating from transposon-derived duplications — get_transposed","text":"Classify gene pairs originating transposon-derived duplications","code":""},{"path":"/reference/get_transposed.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify gene pairs originating from transposon-derived duplications — get_transposed","text":"","code":"get_transposed(   pairs,   blast_inter,   annotation,   evalue = 1e-10,   anchors = 5,   max_gaps = 25,   collinearity_dir = NULL )"},{"path":"/reference/get_transposed.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify gene pairs originating from transposon-derived duplications — get_transposed","text":"pairs 3-column data frame columns dup1, dup2, type indicating duplicated gene 1, duplicated gene 2, mode duplication 
associated pair. data frame returned get_tandem_proximal(). blast_inter list data frames length 1 containing BLAST tabular output comparison target species outgroup. Names list elements must match names list elements annotation. BLASTp, DIAMOND simular programs must run processed sequence data returned syntenet::process_input(). annotation processed GRangesList CompressedGRangesList object returned syntenet::process_input(). evalue Numeric scalar indicating E-value threshold. Default: 1e-10. anchors Numeric indicating minimum required number genes call syntenic block, syntenet::infer_syntenet. Default: 5. max_gaps Numeric indicating number upstream downstream genes search anchors, syntenet::infer_syntenet. Default: 25. collinearity_dir Character indicating path directory .collinearity files stored. NULL, files stored subdirectory tempdir(). Default: NULL.","code":""},{"path":"/reference/get_transposed.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify gene pairs originating from transposon-derived duplications — get_transposed","text":"3-column data frame following variables: dup1 Character, duplicated gene 1. dup2 Character, duplicated gene 2. 
type Factor duplication types, levels \"SD\" (segmental duplication), \"TD\" (tandem duplication), \"PD\" (proximal duplication), \"TRD\" (transposon-derived duplication), \"DD\" (dispersed duplication).","code":""},{"path":"/reference/get_transposed.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify gene pairs originating from transposon-derived duplications — get_transposed","text":"","code":"data(diamond_inter) data(diamond_intra) data(yeast_seq) data(yeast_annot) data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae  # Get processed annotation pdata <- syntenet::process_input(yeast_seq, yeast_annot) annotation <- pdata$annotation  # Get duplicated pairs pairs <- scerevisiae_kaks[, c(\"dup1\", \"dup2\", \"type\")] pairs$dup1 <- paste0(\"Sce_\", pairs$dup1) pairs$dup2 <- paste0(\"Sce_\", pairs$dup2)  # Classify pairs trd <- get_transposed(pairs, diamond_inter, annotation)"},{"path":"/reference/get_transposed_classes.html","id":null,"dir":"Reference","previous_headings":"","what":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","title":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","text":"Classify TRD genes derived either DNA transposons retrotransposons","code":""},{"path":"/reference/get_transposed_classes.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","text":"","code":"get_transposed_classes(pairs, intron_counts)"},{"path":"/reference/get_transposed_classes.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","text":"pairs 3-column data frame columns dup1, dup2, type indicating duplicated gene 1, 
duplicated gene 2, mode duplication associated pair. data frame returned get_transposed(). intron_counts 2-column data frame columns gene introns indicating number introns gene, returned get_intron_counts.","code":""},{"path":"/reference/get_transposed_classes.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","text":"3-column data frame following variables: dup1 Character, duplicated gene 1. dup2 Character, duplicated gene 2. type Factor duplication types, levels \"SD\" (segmental duplication), \"TD\" (tandem duplication), \"PD\" (proximal duplication), \"dTRD\" (DNA transposon-derived duplication), \"rTRD\" (retrotransposon-derived duplication), \"DD\" (dispersed duplication).","code":""},{"path":"/reference/get_transposed_classes.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Classify TRD genes as derived from either DNA transposons or retrotransposons — get_transposed_classes","text":"","code":"data(diamond_inter) data(diamond_intra) data(yeast_seq) data(yeast_annot) data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae  # Get processed annotation pdata <- syntenet::process_input(yeast_seq, yeast_annot) annotation <- pdata$annotation  # Get duplicated pairs pairs <- scerevisiae_kaks[, c(\"dup1\", \"dup2\", \"type\")] pairs$dup1 <- paste0(\"Sce_\", pairs$dup1) pairs$dup2 <- paste0(\"Sce_\", pairs$dup2)  # Classify pairs trd <- get_transposed(pairs, diamond_inter, annotation)  # Create TxDb object from GRanges library(txdbmaker) txdb <- txdbmaker::makeTxDbFromGRanges(yeast_annot[[1]])  # Get intron counts intron_counts <- get_intron_counts(txdb)  # Get TRD classes trd_classes <- get_transposed_classes(trd, intron_counts)"},{"path":"/reference/gmax_ks.html","id":null,"dir":"Reference","previous_headings":"","what":"Duplicate pairs and Ks values for Glycine max — 
gmax_ks","title":"Duplicate pairs and Ks values for Glycine max — gmax_ks","text":"data set obtained classify_gene_pairs() followed pairs2kaks().","code":""},{"path":"/reference/gmax_ks.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Duplicate pairs and Ks values for Glycine max — gmax_ks","text":"","code":"data(gmax_ks)"},{"path":"/reference/gmax_ks.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Duplicate pairs and Ks values for Glycine max — gmax_ks","text":"data frame following variables: dup1 Character, duplicated gene 1. dup2 Character, duplicated gene 2. Ks Numeric, Ks values. type Factor, duplication mode.","code":""},{"path":"/reference/gmax_ks.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Duplicate pairs and Ks values for Glycine max — gmax_ks","text":"","code":"data(gmax_ks)"},{"path":"/reference/pairs2kaks.html","id":null,"dir":"Reference","previous_headings":"","what":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","title":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","text":"Calculate Ka, Ks, Ka/Ks duplicate gene pairs","code":""},{"path":"/reference/pairs2kaks.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","text":"","code":"pairs2kaks(gene_pairs_list, cds, model = \"MYN\", threads = 1, verbose = FALSE)"},{"path":"/reference/pairs2kaks.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","text":"gene_pairs_list List data frames containing duplicated gene pairs returned classify_gene_pairs(). cds List DNAStringSet objects containing coding sequences gene. model Character scalar indicating codon model use. 
Possible values \"Li\", \"NG86\", \"NG\", \"LWL\", \"LPB\", \"MLWL\", \"MLPB\", \"GY\", \"YN\", \"MYN\", \"MS\", \"MA\", \"GNG\", \"GLWL\", \"GLPB\", \"GMLWL\", \"GMLPB\", \"GYN\", \"GMYN\". Default: \"MYN\". threads Numeric indicating number threads use. Default: 1. verbose Logical indicating whether progress messages printed screen. Default: FALSE.","code":""},{"path":"/reference/pairs2kaks.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","text":"list data frames containing gene pairs Ka, Ks, Ka/Ks values.","code":""},{"path":"/reference/pairs2kaks.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Calculate Ka, Ks, and Ka/Ks from duplicate gene pairs — pairs2kaks","text":"","code":"data(diamond_intra) data(diamond_inter) data(yeast_annot) data(yeast_seq) data(cds_scerevisiae) blast_list <- diamond_intra blast_inter <- diamond_inter  pdata <- syntenet::process_input(yeast_seq, yeast_annot) annot <- pdata$annotation[\"Scerevisiae\"]  # Binary classification scheme pairs <- classify_gene_pairs(annot, blast_list) td_pairs <- pairs[[1]][pairs[[1]]$type == \"TD\", ] gene_pairs_list <- list(     Scerevisiae = td_pairs[seq(1, 3, by = 1), ] )  cds <- list(Scerevisiae = cds_scerevisiae)  kaks <- pairs2kaks(gene_pairs_list, cds)"},{"path":"/reference/plot_duplicate_freqs.html","id":null,"dir":"Reference","previous_headings":"","what":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","title":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","text":"Plot frequency duplicates per mode species","code":""},{"path":"/reference/plot_duplicate_freqs.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","text":"","code":"plot_duplicate_freqs(dup_counts, plot_type = 
\"facet\", remove_zero = TRUE)"},{"path":"/reference/plot_duplicate_freqs.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","text":"dup_counts data frame long format number duplicates per mode species, returned function duplicates2counts. plot_type Character indicating plot frequencies. One 'facet' (facets level variable type), 'stack' (levels variable type stacked bars), 'stack_percent' (levels variable type stacked bars, x-axis representing relative frequencies). Default: 'facet'. remove_zero Logical indicating whether remove rows zero values. Default: TRUE.","code":""},{"path":"/reference/plot_duplicate_freqs.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","text":"ggplot object.","code":""},{"path":"/reference/plot_duplicate_freqs.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Plot frequency of duplicates per mode for each species — plot_duplicate_freqs","text":"","code":"data(fungi_kaks)  # Get unique duplicates duplicate_list <- classify_genes(fungi_kaks)  # Get count table dup_counts <- duplicates2counts(duplicate_list)  # Plot counts plot_duplicate_freqs(dup_counts, plot_type = \"stack_percent\")"},{"path":"/reference/plot_ks_distro.html","id":null,"dir":"Reference","previous_headings":"","what":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","title":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","text":"Plot distribution synonymous substitution rates (Ks)","code":""},{"path":"/reference/plot_ks_distro.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","text":"","code":"plot_ks_distro(   ks_df,   min_ks = 0.01,   
max_ks = 2,   bytype = FALSE,   type_levels = NULL,   plot_type = \"histogram\",   binwidth = 0.03 )"},{"path":"/reference/plot_ks_distro.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","text":"ks_df data frame Ks values gene pair returned pairs2kaks(). min_ks Numeric indicating minimum Ks value keep. Default: 0.01. max_ks Numeric indicating maximum Ks value keep. Default: 2. bytype Logical indicating whether plot distribution type duplication (requires column named type). type_levels (valid bytype NULL) Character indicating levels variable specified parameter group_by kept. default, levels kept. plot_type Character indicating type plot create. bytype = TRUE, possible types \"histogram\" \"violin\". bytype = FALSE, possible types \"histogram\", \"density\", \"density_histogram\". Default: \"histogram\". binwidth (valid plot_type = \"histogram\") Numeric indicating bin width. 
Default: 0.03.","code":""},{"path":"/reference/plot_ks_distro.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","text":"ggplot object.","code":""},{"path":"/reference/plot_ks_distro.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Plot distribution of synonymous substitution rates (Ks) — plot_ks_distro","text":"","code":"data(fungi_kaks) ks_df <- fungi_kaks$saccharomyces_cerevisiae  # Plot distro plot_ks_distro(ks_df, bytype = TRUE)"},{"path":"/reference/plot_ks_peaks.html","id":null,"dir":"Reference","previous_headings":"","what":"Plot histogram of Ks distribution with peaks — plot_ks_peaks","title":"Plot histogram of Ks distribution with peaks — plot_ks_peaks","text":"Plot histogram Ks distribution peaks","code":""},{"path":"/reference/plot_ks_peaks.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Plot histogram of Ks distribution with peaks — plot_ks_peaks","text":"","code":"plot_ks_peaks(peaks = NULL, binwidth = 0.05)"},{"path":"/reference/plot_ks_peaks.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Plot histogram of Ks distribution with peaks — plot_ks_peaks","text":"peaks list elements mean, sd, lambda, ks, returned function fins_ks_peaks(). binwidth Numeric scalar binwidth histogram. 
Default: 0.05.","code":""},{"path":"/reference/plot_ks_peaks.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Plot histogram of Ks distribution with peaks — plot_ks_peaks","text":"ggplot object histogram lines Ks peak.","code":""},{"path":"/reference/plot_ks_peaks.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Plot histogram of Ks distribution with peaks — plot_ks_peaks","text":"","code":"data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae ks <- scerevisiae_kaks$Ks  # Find 2 peaks in Ks distribution peaks <- find_ks_peaks(ks, npeaks = 2)  # Plot plot_ks_peaks(peaks, binwidth = 0.05)"},{"path":"/reference/plot_rates_by_species.html","id":null,"dir":"Reference","previous_headings":"","what":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"Plot distributions substitution rates (Ka, Ks, Ka/Ks) per species","code":""},{"path":"/reference/plot_rates_by_species.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"","code":"plot_rates_by_species(   kaks_list,   rate_column = \"Ks\",   bytype = FALSE,   range = c(0, 2),   fill = \"deepskyblue3\",   color = \"deepskyblue4\" )"},{"path":"/reference/plot_rates_by_species.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"kaks_list list data frames substitution rates per gene pair species returned pairs2kaks(). rate_column Character indicating name column plot. Default: \"Ks\". bytype Logical indicating whether show distributions type duplication. Default: FALSE. 
range Numeric vector length 2 indicating minimum maximum values plot. Default: c(0, 2). fill Character color use fill aesthetic. Ignored bytype = TRUE. Default: \"deepskyblue3\". color Character color use color aesthetic. Ignored bytype = FALSE. Default: \"deepskyblue4\".","code":""},{"path":"/reference/plot_rates_by_species.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"ggplot object.","code":""},{"path":"/reference/plot_rates_by_species.html","id":"details","dir":"Reference","previous_headings":"","what":"Details","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"Data plotted using species order list. change order species plot, reorder list elements kaks_list.","code":""},{"path":"/reference/plot_rates_by_species.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Plot distributions of substitution rates (Ka, Ks, or Ka/Ks) per species — plot_rates_by_species","text":"","code":"data(fungi_kaks)  # Plot rates plot_rates_by_species(fungi_kaks, rate_column = \"Ka_Ks\")"},{"path":"/reference/split_pairs_by_peak.html","id":null,"dir":"Reference","previous_headings":"","what":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","title":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","text":"purpose function classify gene pairs age 2+ Ks peaks. 
way, newer gene pairs found within certain number standard deviations highest peak, older genes found close within smaller peaks.","code":""},{"path":"/reference/split_pairs_by_peak.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","text":"","code":"split_pairs_by_peak(ks_df, peaks, nsd = 2, binwidth = 0.05)"},{"path":"/reference/split_pairs_by_peak.html","id":"arguments","dir":"Reference","previous_headings":"","what":"Arguments","title":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","text":"ks_df 3-column data frame gene pairs columns 1 2, Ks values gene pair column 3. peaks list mean, standard deviation, amplitude Ks peaks generated find_ks_peaks. nsd Numeric number standard deviations consider peak. binwidth Numeric scalar binwidth histogram. Default: 0.05.","code":""},{"path":"/reference/split_pairs_by_peak.html","id":"value","dir":"Reference","previous_headings":"","what":"Value","title":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","text":"list following elements: pairs 4-column data frame variables dup1 (character), dup2 (character), ks (numeric), peak (numeric), representing duplicate gene pair, Ks values, peak ID, respectively. 
plot ggplot object Ks peaks returned plot_ks_peaks, dashed red lines indicating boundaries peak.","code":""},{"path":"/reference/split_pairs_by_peak.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Split gene pairs based on their Ks peaks — split_pairs_by_peak","text":"","code":"data(fungi_kaks) scerevisiae_kaks <- fungi_kaks$saccharomyces_cerevisiae  # Create a data frame of duplicate pairs and Ks values ks_df <- scerevisiae_kaks[, c(\"dup1\", \"dup2\", \"Ks\")]  # Create list of peaks peaks <- find_ks_peaks(ks_df$Ks, npeaks = 2)  # Split pairs spairs <- split_pairs_by_peak(ks_df, peaks)"},{"path":"/reference/yeast_annot.html","id":null,"dir":"Reference","previous_headings":"","what":"Genome annotation of the yeast species S. cerevisiae and C. glabrata — yeast_annot","title":"Genome annotation of the yeast species S. cerevisiae and C. glabrata — yeast_annot","text":"Data obtained Ensembl Fungi. annotation data protein-coding genes (associated mRNA, exons, CDS, etc) included.","code":""},{"path":"/reference/yeast_annot.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Genome annotation of the yeast species S. cerevisiae and C. glabrata — yeast_annot","text":"","code":"data(yeast_annot)"},{"path":"/reference/yeast_annot.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Genome annotation of the yeast species S. cerevisiae and C. glabrata — yeast_annot","text":"CompressedGRangesList containing elements Scerevisiae Cglabrata.","code":""},{"path":"/reference/yeast_annot.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Genome annotation of the yeast species S. cerevisiae and C. glabrata — yeast_annot","text":"","code":"data(yeast_annot)"},{"path":"/reference/yeast_seq.html","id":null,"dir":"Reference","previous_headings":"","what":"Protein sequences of the yeast species S. cerevisiae and C. 
glabrata — yeast_seq","title":"Protein sequences of the yeast species S. cerevisiae and C. glabrata — yeast_seq","text":"Data obtained Ensembl Fungi. translated sequences primary transcripts included.","code":""},{"path":"/reference/yeast_seq.html","id":"ref-usage","dir":"Reference","previous_headings":"","what":"Usage","title":"Protein sequences of the yeast species S. cerevisiae and C. glabrata — yeast_seq","text":"","code":"data(yeast_seq)"},{"path":"/reference/yeast_seq.html","id":"format","dir":"Reference","previous_headings":"","what":"Format","title":"Protein sequences of the yeast species S. cerevisiae and C. glabrata — yeast_seq","text":"list AAStringSet objects elements Scerevisiae Cglabrata.","code":""},{"path":"/reference/yeast_seq.html","id":"ref-examples","dir":"Reference","previous_headings":"","what":"Examples","title":"Protein sequences of the yeast species S. cerevisiae and C. glabrata — yeast_seq","text":"","code":"data(yeast_seq)"},{"path":"/news/index.html","id":"doubletrouble-0990","dir":"Changelog","previous_headings":"","what":"doubletrouble 0.99.0","title":"doubletrouble 0.99.0","text":"NEW FEATURES Added NEWS.md file track changes package.","code":""},{"path":"/news/index.html","id":"doubletrouble-0992","dir":"Changelog","previous_headings":"","what":"doubletrouble 0.99.2","title":"doubletrouble 0.99.2","text":"CHANGES Small change coding style Bioconductor peer-review (m:n replaced c(m, n) seq(m,n))","code":""},{"path":"/news/index.html","id":"doubletrouble-0993","dir":"Changelog","previous_headings":"","what":"doubletrouble 0.99.3","title":"doubletrouble 0.99.3","text":"BUG FIXES Updated functions (e.g., get_anchor_list(), collinearity2blocks()) update syntenet.","code":""}]

Scheme	Duplication modes
binary	SD, SSD
standard	SD, TD, PD, DD
extended	SD, TD, PD, TRD, DD
full	SD, TD, PD, rTRD, dTRD, DD