diff --git a/joss.06062/10.21105.joss.06062.crossref.xml b/joss.06062/10.21105.joss.06062.crossref.xml
new file mode 100644
index 0000000000..028fdad06f
--- /dev/null
+++ b/joss.06062/10.21105.joss.06062.crossref.xml
@@ -0,0 +1,445 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<doi_batch xmlns="http://www.crossref.org/schema/5.3.1"
+           xmlns:ai="http://www.crossref.org/AccessIndicators.xsd"
+           xmlns:rel="http://www.crossref.org/relations.xsd"
+           xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+           version="5.3.1"
+           xsi:schemaLocation="http://www.crossref.org/schema/5.3.1 http://www.crossref.org/schemas/crossref5.3.1.xsd">
+  <head>
+    <doi_batch_id>20240325T090939-2222b389c1b6b872836c818c252b79933a5735e5</doi_batch_id>
+    <timestamp>20240325090939</timestamp>
+    <depositor>
+      <depositor_name>JOSS Admin</depositor_name>
+      <email_address>admin@theoj.org</email_address>
+    </depositor>
+    <registrant>The Open Journal</registrant>
+  </head>
+  <body>
+    <journal>
+      <journal_metadata>
+        <full_title>Journal of Open Source Software</full_title>
+        <abbrev_title>JOSS</abbrev_title>
+        <issn media_type="electronic">2475-9066</issn>
+        <doi_data>
+          <doi>10.21105/joss</doi>
+          <resource>https://joss.theoj.org</resource>
+        </doi_data>
+      </journal_metadata>
+      <journal_issue>
+        <publication_date media_type="online">
+          <month>03</month>
+          <year>2024</year>
+        </publication_date>
+        <journal_volume>
+          <volume>9</volume>
+        </journal_volume>
+        <issue>95</issue>
+      </journal_issue>
+      <journal_article publication_type="full_text">
+        <titles>
+          <title>Acanthophis: a comprehensive plant hologenomics
+pipeline</title>
+        </titles>
+        <contributors>
+          <person_name sequence="first" contributor_role="author">
+            <given_name>Kevin D.</given_name>
+            <surname>Murray</surname>
+            <ORCID>https://orcid.org/0000-0002-2466-1917</ORCID>
+          </person_name>
+          <person_name sequence="additional"
+                       contributor_role="author">
+            <given_name>Justin O.</given_name>
+            <surname>Borevitz</surname>
+            <ORCID>https://orcid.org/0000-0001-8408-3699</ORCID>
+          </person_name>
+          <person_name sequence="additional"
+                       contributor_role="author">
+            <given_name>Detlef</given_name>
+            <surname>Weigel</surname>
+            <ORCID>https://orcid.org/0000-0002-2114-7963</ORCID>
+          </person_name>
+          <person_name sequence="additional"
+                       contributor_role="author">
+            <given_name>Norman</given_name>
+            <surname>Warthmann</surname>
+            <ORCID>https://orcid.org/0000-0002-1178-8409</ORCID>
+          </person_name>
+        </contributors>
+        <publication_date>
+          <month>03</month>
+          <day>25</day>
+          <year>2024</year>
+        </publication_date>
+        <pages>
+          <first_page>6062</first_page>
+        </pages>
+        <publisher_item>
+          <identifier id_type="doi">10.21105/joss.06062</identifier>
+        </publisher_item>
+        <ai:program name="AccessIndicators">
+          <ai:license_ref applies_to="vor">http://creativecommons.org/licenses/by/4.0/</ai:license_ref>
+          <ai:license_ref applies_to="am">http://creativecommons.org/licenses/by/4.0/</ai:license_ref>
+          <ai:license_ref applies_to="tdm">http://creativecommons.org/licenses/by/4.0/</ai:license_ref>
+        </ai:program>
+        <rel:program>
+          <rel:related_item>
+            <rel:description>Software archive</rel:description>
+            <rel:inter_work_relation relationship-type="references" identifier-type="doi">10.5281/zenodo.10795245</rel:inter_work_relation>
+          </rel:related_item>
+          <rel:related_item>
+            <rel:description>GitHub review issue</rel:description>
+            <rel:inter_work_relation relationship-type="hasReview" identifier-type="uri">https://github.com/openjournals/joss-reviews/issues/6062</rel:inter_work_relation>
+          </rel:related_item>
+        </rel:program>
+        <doi_data>
+          <doi>10.21105/joss.06062</doi>
+          <resource>https://joss.theoj.org/papers/10.21105/joss.06062</resource>
+          <collection property="text-mining">
+            <item>
+              <resource mime_type="application/pdf">https://joss.theoj.org/papers/10.21105/joss.06062.pdf</resource>
+            </item>
+          </collection>
+        </doi_data>
+        <citation_list>
+          <citation key="ahrens21_genomicconstraints">
+            <article_title>Genomic constraints to drought
+adaptation</article_title>
+            <author>Ahrens</author>
+            <doi>10.1101/2021.08.07.455511</doi>
+            <cYear>2021</cYear>
+            <unstructured_citation>Ahrens, C. W., Murray, K. D.,
+Mazanec, R. A., Ferguson, S., Bragg, J., Jones, A., Tissue, D. T.,
+Byrne, M., Borevitz, J. O., &amp; Rymer, P. D. (2021, August 8). Genomic
+constraints to drought adaptation.
+https://doi.org/10.1101/2021.08.07.455511</unstructured_citation>
+          </citation>
+          <citation key="beber23_taxpastataxonomic">
+            <article_title>TAXPASTA: TAXonomic Profile Aggregation and
+STAndardisation</article_title>
+            <author>Beber</author>
+            <journal_title>Journal of Open Source
+Software</journal_title>
+            <issue>87</issue>
+            <volume>8</volume>
+            <doi>10.21105/joss.05627</doi>
+            <issn>2475-9066</issn>
+            <cYear>2023</cYear>
+            <unstructured_citation>Beber, M. E., Borry, M., Stamouli,
+S., &amp; Yates, J. A. F. (2023). TAXPASTA: TAXonomic Profile
+Aggregation and STAndardisation. Journal of Open Source Software, 8(87),
+5627. https://doi.org/10.21105/joss.05627</unstructured_citation>
+          </citation>
+          <citation key="buchfink21_sensitive">
+            <article_title>Sensitive protein alignments at tree-of-life
+scale using DIAMOND</article_title>
+            <author>Buchfink</author>
+            <journal_title>Nature Methods</journal_title>
+            <issue>4</issue>
+            <volume>18</volume>
+            <doi>10.1038/s41592-021-01101-x</doi>
+            <issn>1548-7105</issn>
+            <cYear>2021</cYear>
+            <unstructured_citation>Buchfink, B., Reuter, K., &amp;
+Drost, H.-G. (2021). Sensitive protein alignments at tree-of-life scale
+using DIAMOND. Nature Methods, 18(4), 366–368.
+https://doi.org/10.1038/s41592-021-01101-x</unstructured_citation>
+          </citation>
+          <citation key="danecek21_twelveyears">
+            <article_title>Twelve years of SAMtools and
+BCFtools</article_title>
+            <author>Danecek</author>
+            <journal_title>GigaScience</journal_title>
+            <issue>2</issue>
+            <volume>10</volume>
+            <doi>10.1093/gigascience/giab008</doi>
+            <issn>2047-217X</issn>
+            <cYear>2021</cYear>
+            <unstructured_citation>Danecek, P., Bonfield, J. K., Liddle,
+J., Marshall, J., Ohan, V., Pollard, M. O., Whitwham, A., Keane, T.,
+McCarthy, S. A., Davies, R. M., &amp; Li, H. (2021). Twelve years of
+SAMtools and BCFtools. GigaScience, 10(2), giab008.
+https://doi.org/10.1093/gigascience/giab008</unstructured_citation>
+          </citation>
+          <citation key="ewels16_multiqcsummarize">
+            <article_title>MultiQC: Summarize analysis results for
+multiple tools and samples in a single report</article_title>
+            <author>Ewels</author>
+            <journal_title>Bioinformatics (Oxford,
+England)</journal_title>
+            <issue>19</issue>
+            <volume>32</volume>
+            <doi>10.1093/bioinformatics/btw354</doi>
+            <issn>1367-4811</issn>
+            <cYear>2016</cYear>
+            <unstructured_citation>Ewels, P., Magnusson, M., Lundin, S.,
+&amp; Käller, M. (2016). MultiQC: Summarize analysis results for
+multiple tools and samples in a single report. Bioinformatics (Oxford,
+England), 32(19), 3047–3048.
+https://doi.org/10.1093/bioinformatics/btw354</unstructured_citation>
+          </citation>
+          <citation key="kim16_centrifugerapid">
+            <article_title>Centrifuge: Rapid and sensitive
+classification of metagenomic sequences</article_title>
+            <author>Kim</author>
+            <journal_title>Genome Research</journal_title>
+            <doi>10.1101/gr.210641.116</doi>
+            <issn>1088-9051</issn>
+            <cYear>2016</cYear>
+            <unstructured_citation>Kim, D., Song, L., Breitwieser, F.
+P., &amp; Salzberg, S. L. (2016). Centrifuge: Rapid and sensitive
+classification of metagenomic sequences. Genome Research.
+https://doi.org/10.1101/gr.210641.116</unstructured_citation>
+          </citation>
+          <citation key="koster12_snakemakescalable">
+            <article_title>Snakemake — a scalable bioinformatics
+workflow engine</article_title>
+            <author>Köster</author>
+            <journal_title>Bioinformatics</journal_title>
+            <issue>19</issue>
+            <volume>28</volume>
+            <doi>10.1093/bioinformatics/bts480</doi>
+            <issn>1367-4803</issn>
+            <cYear>2012</cYear>
+            <unstructured_citation>Köster, J., &amp; Rahmann, S. (2012).
+Snakemake — a scalable bioinformatics workflow engine. Bioinformatics,
+28(19), 2520–2522.
+https://doi.org/10.1093/bioinformatics/bts480</unstructured_citation>
+          </citation>
+          <citation key="koster21_snakemakeworkflows">
+            <article_title>Snakemake-workflows/dna-seq-gatk-variant-calling</article_title>
+            <author>Köster</author>
+            <doi>10.5281/ZENODO.4677629</doi>
+            <cYear>2021</cYear>
+            <unstructured_citation>Köster, J., Micwessolly, Kuthe, E.,
+&amp; De Coster, W. (2021).
+Snakemake-workflows/dna-seq-gatk-variant-calling.
+https://doi.org/10.5281/ZENODO.4677629</unstructured_citation>
+          </citation>
+          <citation key="li09_sequencealignment">
+            <article_title>The Sequence Alignment/Map format and
+SAMtools</article_title>
+            <author>Li</author>
+            <journal_title>Bioinformatics (Oxford,
+England)</journal_title>
+            <issue>16</issue>
+            <volume>25</volume>
+            <doi>10.1093/bioinformatics/btp352</doi>
+            <issn>1367-4811</issn>
+            <cYear>2009</cYear>
+            <unstructured_citation>Li, H., Handsaker, B., Wysoker, A.,
+Fennell, T., Ruan, J., Homer, N., Marth, G., Abecasis, G., Durbin, R.,
+&amp; 1000 Genome Project Data Processing Subgroup. (2009). The Sequence
+Alignment/Map format and SAMtools. Bioinformatics (Oxford, England),
+25(16), 2078–2079.
+https://doi.org/10.1093/bioinformatics/btp352</unstructured_citation>
+          </citation>
+          <citation key="li13_aligningsequence">
+            <article_title>Aligning sequence reads, clone sequences and
+assembly contigs with BWA-MEM</article_title>
+            <author>Li</author>
+            <doi>10.48550/arXiv.1303.3997</doi>
+            <cYear>2013</cYear>
+            <unstructured_citation>Li, H. (2013). Aligning sequence
+reads, clone sequences and assembly contigs with BWA-MEM.
+https://doi.org/10.48550/arXiv.1303.3997</unstructured_citation>
+          </citation>
+          <citation key="li18_minimap2pairwise">
+            <article_title>Minimap2: Pairwise alignment for nucleotide
+sequences</article_title>
+            <author>Li</author>
+            <journal_title>Bioinformatics</journal_title>
+            <issue>18</issue>
+            <volume>34</volume>
+            <doi>10.1093/bioinformatics/bty191</doi>
+            <issn>1367-4803</issn>
+            <cYear>2018</cYear>
+            <unstructured_citation>Li, H. (2018). Minimap2: Pairwise
+alignment for nucleotide sequences. Bioinformatics, 34(18), 3094–3100.
+https://doi.org/10.1093/bioinformatics/bty191</unstructured_citation>
+          </citation>
+          <citation key="li21_newstrategies">
+            <article_title>New strategies to improve Minimap2 alignment
+accuracy</article_title>
+            <author>Li</author>
+            <journal_title>Bioinformatics</journal_title>
+            <issue>23</issue>
+            <volume>37</volume>
+            <doi>10.1093/bioinformatics/btab705</doi>
+            <issn>1367-4803</issn>
+            <cYear>2021</cYear>
+            <unstructured_citation>Li, H. (2021). New strategies to
+improve Minimap2 alignment accuracy. Bioinformatics, 37(23), 4572–4574.
+https://doi.org/10.1093/bioinformatics/btab705</unstructured_citation>
+          </citation>
+          <citation key="lu17_brackenestimating">
+            <article_title>Bracken: Estimating species abundance in
+metagenomics data</article_title>
+            <author>Lu</author>
+            <journal_title>PeerJ Computer Science</journal_title>
+            <volume>3</volume>
+            <doi>10.7717/peerj-cs.104</doi>
+            <issn>2376-5992</issn>
+            <cYear>2017</cYear>
+            <unstructured_citation>Lu, J., Breitwieser, F. P., Thielen,
+P., &amp; Salzberg, S. L. (2017). Bracken: Estimating species abundance
+in metagenomics data. PeerJ Computer Science, 3, e104.
+https://doi.org/10.7717/peerj-cs.104</unstructured_citation>
+          </citation>
+          <citation key="menzel16_fastsensitive">
+            <article_title>Fast and sensitive taxonomic classification
+for metagenomics with Kaiju</article_title>
+            <author>Menzel</author>
+            <journal_title>Nature Communications</journal_title>
+            <volume>7</volume>
+            <doi>10.1038/ncomms11257</doi>
+            <issn>2041-1723</issn>
+            <cYear>2016</cYear>
+            <unstructured_citation>Menzel, P., Ng, K. L., &amp; Krogh,
+A. (2016). Fast and sensitive taxonomic classification for metagenomics
+with Kaiju. Nature Communications, 7, 11257.
+https://doi.org/10.1038/ncomms11257</unstructured_citation>
+          </citation>
+          <citation key="murray17_kwipkmer">
+            <article_title>kWIP: The k-mer weighted inner product, a de
+novo estimator of genetic similarity</article_title>
+            <author>Murray</author>
+            <journal_title>PLOS Computational Biology</journal_title>
+            <issue>9</issue>
+            <volume>13</volume>
+            <doi>10.1371/journal.pcbi.1005727</doi>
+            <issn>1553-7358</issn>
+            <cYear>2017</cYear>
+            <unstructured_citation>Murray, K. D., Webers, C., Ong, C.
+S., Borevitz, J., &amp; Warthmann, N. (2017). kWIP: The k-mer weighted
+inner product, a de novo estimator of genetic similarity. PLOS
+Computational Biology, 13(9), e1005727.
+https://doi.org/10.1371/journal.pcbi.1005727</unstructured_citation>
+          </citation>
+          <citation key="murray19_landscapedrivers">
+            <article_title>Landscape drivers of genomic diversity and
+divergence in woodland Eucalyptus</article_title>
+            <author>Murray</author>
+            <journal_title>Molecular Ecology</journal_title>
+            <issue>24</issue>
+            <volume>28</volume>
+            <doi>10.1111/mec.15287</doi>
+            <issn>0962-1083</issn>
+            <cYear>2019</cYear>
+            <unstructured_citation>Murray, K. D., Janes, J. K., Jones,
+A., Bothwell, H. M., Andrew, R. L., &amp; Borevitz, J. O. (2019).
+Landscape drivers of genomic diversity and divergence in woodland
+Eucalyptus. Molecular Ecology, 28(24), 5232–5247.
+https://doi.org/10.1111/mec.15287</unstructured_citation>
+          </citation>
+          <citation key="ondov16_mashfast">
+            <article_title>Mash: Fast genome and metagenome distance
+estimation using MinHash</article_title>
+            <author>Ondov</author>
+            <journal_title>Genome Biology</journal_title>
+            <volume>17</volume>
+            <doi>10.1186/s13059-016-0997-x</doi>
+            <issn>1474-760X</issn>
+            <cYear>2016</cYear>
+            <unstructured_citation>Ondov, B. D., Treangen, T. J.,
+Melsted, P., Mallonee, A. B., Bergman, N. H., Koren, S., &amp;
+Phillippy, A. M. (2016). Mash: Fast genome and metagenome distance
+estimation using MinHash. Genome Biology, 17, 132.
+https://doi.org/10.1186/s13059-016-0997-x</unstructured_citation>
+          </citation>
+          <citation key="pedersen18_mosdepthquick">
+            <article_title>Mosdepth: Quick coverage calculation for
+genomes and exomes</article_title>
+            <author>Pedersen</author>
+            <journal_title>Bioinformatics (Oxford,
+England)</journal_title>
+            <issue>5</issue>
+            <volume>34</volume>
+            <doi>10.1093/bioinformatics/btx699</doi>
+            <issn>1367-4811</issn>
+            <cYear>2018</cYear>
+            <unstructured_citation>Pedersen, B. S., &amp; Quinlan, A. R.
+(2018). Mosdepth: Quick coverage calculation for genomes and exomes.
+Bioinformatics (Oxford, England), 34(5), 867–868.
+https://doi.org/10.1093/bioinformatics/btx699</unstructured_citation>
+          </citation>
+          <citation key="regalado20_combining">
+            <article_title>Combining whole-genome shotgun sequencing and
+rRNA gene amplicon analyses to improve detection of microbe–microbe
+interaction networks in plant leaves</article_title>
+            <author>Regalado</author>
+            <journal_title>The ISME Journal</journal_title>
+            <issue>8</issue>
+            <volume>14</volume>
+            <doi>10.1038/s41396-020-0665-8</doi>
+            <issn>1751-7370</issn>
+            <cYear>2020</cYear>
+            <unstructured_citation>Regalado, J., Lundberg, D. S.,
+Deusch, O., Kersten, S., Karasov, T., Poersch, K., Shirsekar, G., &amp;
+Weigel, D. (2020). Combining whole-genome shotgun sequencing and rRNA
+gene amplicon analyses to improve detection of microbe–microbe
+interaction networks in plant leaves. The ISME Journal, 14(8),
+2116–2130.
+https://doi.org/10.1038/s41396-020-0665-8</unstructured_citation>
+          </citation>
+          <citation key="schubert16_adapterremoval">
+            <article_title>AdapterRemoval v2: Rapid adapter trimming,
+identification, and read merging</article_title>
+            <author>Schubert</author>
+            <journal_title>BMC Research Notes</journal_title>
+            <volume>9</volume>
+            <doi>10.1186/s13104-016-1900-2</doi>
+            <issn>1756-0500</issn>
+            <cYear>2016</cYear>
+            <unstructured_citation>Schubert, M., Lindgreen, S., &amp;
+Orlando, L. (2016). AdapterRemoval v2: Rapid adapter trimming,
+identification, and read merging. BMC Research Notes, 9, 88.
+https://doi.org/10.1186/s13104-016-1900-2</unstructured_citation>
+          </citation>
+          <citation key="sedlazeck13_nextgenmapfast">
+            <article_title>NextGenMap: Fast and accurate read mapping in
+highly polymorphic genomes</article_title>
+            <author>Sedlazeck</author>
+            <journal_title>Bioinformatics</journal_title>
+            <issue>21</issue>
+            <volume>29</volume>
+            <doi>10.1093/bioinformatics/btt468</doi>
+            <issn>1367-4803</issn>
+            <cYear>2013</cYear>
+            <unstructured_citation>Sedlazeck, F. J., Rescheneder, P.,
+&amp; Von Haeseler, A. (2013). NextGenMap: Fast and accurate read
+mapping in highly polymorphic genomes. Bioinformatics, 29(21),
+2790–2791.
+https://doi.org/10.1093/bioinformatics/btt468</unstructured_citation>
+          </citation>
+          <citation key="wood19_improved">
+            <article_title>Improved metagenomic analysis with Kraken
+2</article_title>
+            <author>Wood</author>
+            <journal_title>Genome Biology</journal_title>
+            <issue>1</issue>
+            <volume>20</volume>
+            <doi>10.1186/s13059-019-1891-0</doi>
+            <issn>1474-760X</issn>
+            <cYear>2019</cYear>
+            <unstructured_citation>Wood, D. E., Lu, J., &amp; Langmead,
+B. (2019). Improved metagenomic analysis with Kraken 2. Genome Biology,
+20(1), 1–13.
+https://doi.org/10.1186/s13059-019-1891-0</unstructured_citation>
+          </citation>
+          <citation key="yates23_nfcore">
+            <article_title>Nf-core/taxprofiler</article_title>
+            <author>Yates</author>
+            <doi>10.5281/ZENODO.7728364</doi>
+            <cYear>2023</cYear>
+            <unstructured_citation>Yates, J. A. F., Stamouli, S.,
+Andersson-Li, L., Beber, M. E., Mesilaakso, L., Nf-Core Bot,
+Christensen, T. A., Mahwash Jamy, JIANHONG OU, Stepien, R., Borry, M.,
+Husen M. Umer, Syme, R., Hübner, A., &amp; Zandra Fagernäs. (2023).
+Nf-core/taxprofiler.
+https://doi.org/10.5281/ZENODO.7728364</unstructured_citation>
+          </citation>
+        </citation_list>
+      </journal_article>
+    </journal>
+  </body>
+</doi_batch>
diff --git a/joss.06062/10.21105.joss.06062.jats b/joss.06062/10.21105.joss.06062.jats
new file mode 100644
index 0000000000..d63a48baee
--- /dev/null
+++ b/joss.06062/10.21105.joss.06062.jats
@@ -0,0 +1,792 @@
+<?xml version="1.0" encoding="utf-8" ?>
+<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN"
+                  "JATS-publishing1.dtd">
+<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="1.2" article-type="other">
+<front>
+<journal-meta>
+<journal-id></journal-id>
+<journal-title-group>
+<journal-title>Journal of Open Source Software</journal-title>
+<abbrev-journal-title>JOSS</abbrev-journal-title>
+</journal-title-group>
+<issn publication-format="electronic">2475-9066</issn>
+<publisher>
+<publisher-name>Open Journals</publisher-name>
+</publisher>
+</journal-meta>
+<article-meta>
+<article-id pub-id-type="publisher-id">6062</article-id>
+<article-id pub-id-type="doi">10.21105/joss.06062</article-id>
+<title-group>
+<article-title>Acanthophis: a comprehensive plant hologenomics
+pipeline</article-title>
+</title-group>
+<contrib-group>
+<contrib contrib-type="author" corresp="yes">
+<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-2466-1917</contrib-id>
+<name>
+<surname>Murray</surname>
+<given-names>Kevin D.</given-names>
+</name>
+<email>kdmpapers@gmail.com</email>
+<xref ref-type="aff" rid="aff-1"/>
+<xref ref-type="corresp" rid="cor-1"><sup>*</sup></xref>
+</contrib>
+<contrib contrib-type="author">
+<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-8408-3699</contrib-id>
+<name>
+<surname>Borevitz</surname>
+<given-names>Justin O.</given-names>
+</name>
+<xref ref-type="aff" rid="aff-2"/>
+</contrib>
+<contrib contrib-type="author">
+<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-2114-7963</contrib-id>
+<name>
+<surname>Weigel</surname>
+<given-names>Detlef</given-names>
+</name>
+<xref ref-type="aff" rid="aff-1"/>
+</contrib>
+<contrib contrib-type="author" corresp="yes">
+<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-1178-8409</contrib-id>
+<name>
+<surname>Warthmann</surname>
+<given-names>Norman</given-names>
+</name>
+<xref ref-type="aff" rid="aff-2"/>
+<xref ref-type="aff" rid="aff-3"/>
+<xref ref-type="corresp" rid="cor-2"><sup>*</sup></xref>
+</contrib>
+<aff id="aff-1">
+<institution-wrap>
+<institution>Max Planck Institute for Biology Tübingen, 72076 Tübingen,
+Germany</institution>
+</institution-wrap>
+</aff>
+<aff id="aff-2">
+<institution-wrap>
+<institution>Research School of Biology, Australian National University,
+Canberra, Australia</institution>
+</institution-wrap>
+</aff>
+<aff id="aff-3">
+<institution-wrap>
+<institution>FAO/IAEA Joint Centre of Nuclear Techniques in Food and
+Agriculture, Plant Breeding and Genetics Laboratory, Seibersdorf,
+Austria</institution>
+</institution-wrap>
+</aff>
+</contrib-group>
+<author-notes>
+<corresp id="cor-1">* E-mail: <email>kdmpapers@gmail.com</email></corresp>
+<corresp id="cor-2">* E-mail: <email></email></corresp>
+</author-notes>
+<pub-date date-type="pub" publication-format="electronic" iso-8601-date="2024-03-25">
+<day>25</day>
+<month>03</month>
+<year>2024</year>
+</pub-date>
+<volume>9</volume>
+<issue>95</issue>
+<fpage>6062</fpage>
+<permissions>
+<copyright-statement>Authors of papers retain copyright and release the
+work under a Creative Commons Attribution 4.0 International License (CC
+BY 4.0)</copyright-statement>
+<copyright-year>2022</copyright-year>
+<copyright-holder>The article authors</copyright-holder>
+<license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
+<license-p>Authors of papers retain copyright and release the work under
+a Creative Commons Attribution 4.0 International License (CC BY
+4.0)</license-p>
+</license>
+</permissions>
+<kwd-group kwd-group-type="author">
+<kwd>python</kwd>
+<kwd>snakemake</kwd>
+<kwd>plants</kwd>
+<kwd>metagenomics</kwd>
+<kwd>variant calling</kwd>
+<kwd>population genomics</kwd>
+<kwd>reference-free classification</kwd>
+</kwd-group>
+</article-meta>
+</front>
+<body>
+<sec id="summary">
+  <title>Summary</title>
+  <p>Acanthophis is a comprehensive pipeline for the joint analysis of
+  both host genetic variation and variation in the composition and
+  abundance of host-associated microbiomes (together, the “hologenome”).
+  Implemented in Snakemake
+  (<xref alt="Köster &amp; Rahmann, 2012" rid="ref-koster12_snakemakescalable" ref-type="bibr">Köster
+  &amp; Rahmann, 2012</xref>), Acanthophis handles data from raw FASTQ
+  read files through quality control, alignment of the reads to a plant
+  reference, variant calling, taxonomic classification and
+  quantification of microbes, and metagenome analysis. The workflow
+  contains numerous practical optimisations, both to reduce disk space
+  usage and maximise utilisation of computational resources. Acanthophis
+  is available under the Mozilla Public Licence v2 at
+  <ext-link ext-link-type="uri" xlink:href="https://github.com/kdm9/Acanthophis">https://github.com/kdm9/Acanthophis</ext-link>
+  as a python package installable from conda or PyPI
+  (<monospace>pip install acanthophis</monospace>).</p>
+</sec>
+<sec id="statement-of-need">
+  <title>Statement of Need</title>
+  <p>Understanding plant biology benefits from ecosystem-scale analysis
+  of genetic variation, and increasingly demands the characterisation of
+  not only plant genomes but also the genomes of their associated
+  microbes. Such analyses are often data intensive, particularly at the
+  scale required for quantitative analyses, i.e. hundreds to thousands
+  of samples
+  (<xref alt="Regalado et al., 2020" rid="ref-regalado20_combining" ref-type="bibr">Regalado
+  et al., 2020</xref>). They demand computationally-efficient pipelines
+  that perform both host genotyping and host-associated microbiome
+  characterisation in a consistent, flexible, and reproducible
+  fashion.</p>
+  <p>Currently, no such unified pipelines exist. Previous pipelines
+  perform only a subset of these tasks (e.g. Snakemake’s variant calling
+  pipeline; Köster et al.
+  (<xref alt="2021" rid="ref-koster21_snakemakeworkflows" ref-type="bibr">2021</xref>)).
+  In addition, most host-aware microbiome analysis pipelines do not
+  allow for genotyping and/or assume an animal host (e.g. Taxprofiler;
+  Yates et al.
+  (<xref alt="2023" rid="ref-yates23_nfcore" ref-type="bibr">2023</xref>)).
+  Acanthophis has attracted many users, and has been used in
+  peer-reviewed journal articles and preprints (e.g. Murray et al.
+  (<xref alt="2019" rid="ref-murray19_landscapedrivers" ref-type="bibr">2019</xref>);
+  Ahrens et al.
+  (<xref alt="2021" rid="ref-ahrens21_genomicconstraints" ref-type="bibr">2021</xref>)).</p>
+</sec>
+<sec id="components-and-features">
+  <title>Components and Features</title>
+  <p>Acanthophis is a pipeline for the analysis of plant population
+  resequencing data. It expects short-read shotgun whole (meta-)genome
+  sequencing data, typically of plants collected in the field (nothing
+  fundamentally prevents Acanthophis from operating on long-read data;
+  however, additional tools would need to be incorporated, which will
+  happen given sufficient user demand). A typical dataset might comprise
+  tens to thousands of samples from one or multiple closely related
+  species, sequenced with 2x150bp paired-end short-read sequencing. In a
+  plant-microbe interaction genomics study, these plants and therefore
+  sequencing libraries can contain microbial DNA (a “hologenome”), but
+  datasets focusing only on host genome variation are also possible.
+  Acanthophis can be configured to do any of the following analyses:
+  mapping reads to a reference, calling variants, annotating variant
+  effects, estimating genetic distances directly from sequence reads
+  (<italic>de novo</italic>), and profiling and/or assembling
+  metagenomes. While we developed Acanthophis to handle plant data,
+  there is no reason why it cannot be applied to other taxa, although
+  some parameters may need adjustment (see below). Philosophically,
+  Acanthophis aims for maximum efficiency and flexibility, and therefore
+  does not bake any particular biological question into its outputs. As
+  such, each user should, for example, filter the resulting variant files
+  as appropriate for their biological question(s), and likewise apply
+  other post-processing as needed.</p>
+  <p>Across the entire pipeline, Acanthophis operates on ‘sample sets’,
+  named groups of one or more samples, and each sample can be in any
+  number of sample sets. The pipeline is configured via a global
+  <monospace>config.yaml</monospace> file, in which one can configure
+  the pipeline per sample-set. This way, one can configure the analyses
+  to be run (most of the below analysis stages can be skipped if not
+  needed), as well as tool-specific settings or thresholds. We provide a
+  documented template as well as a reproducible workflow to simulate
+  test data, which can be used as a basis for customisation. While
+  Acanthophis is cross-platform, most of the underlying tools are only
+  packaged for and/or only operate on GNU/Linux operating systems.
+  Therefore, Acanthophis is only actively supported for users on Linux
+  systems.</p>
+  <sec id="stage-1-raw-reads-to-per-sample-reads">
+    <title>Stage 1: Raw reads to per-sample reads</title>
+    <p>Input data consists of FASTQ files per <bold>run</bold> of each
+    <bold>library</bold> corresponding to a <bold>sample</bold>. For
+    each <bold>run</bold> of each <bold>library</bold>, Acanthophis uses
+    <monospace>AdapterRemoval</monospace>
+    (<xref alt="Schubert et al., 2016" rid="ref-schubert16_adapterremoval" ref-type="bibr">Schubert
+    et al., 2016</xref>) to remove low quality and adapter sequences,
+    and optionally to merge overlapping read pairs. It then uses
+    <monospace>FastQC</monospace> to summarise sequence QC before and
+    after <monospace>AdapterRemoval</monospace>.</p>
+  </sec>
+  <sec id="stage-2-alignment-to-references">
+    <title>Stage 2: Alignment to reference(s)</title>
+    <p>To align reads to reference genomes, Acanthophis can use any of
+    <monospace>BWA MEM</monospace>
+    (<xref alt="Li, 2013" rid="ref-li13_aligningsequence" ref-type="bibr">Li,
+    2013</xref>), <monospace>NGM</monospace>
+    (<xref alt="Sedlazeck et al., 2013" rid="ref-sedlazeck13_nextgenmapfast" ref-type="bibr">Sedlazeck
+    et al., 2013</xref>), and <monospace>minimap2</monospace>
+    (<xref alt="Li, 2018" rid="ref-li18_minimap2pairwise" ref-type="bibr">Li,
+    2018</xref>,
+    <xref alt="2021" rid="ref-li21_newstrategies" ref-type="bibr">2021</xref>).
+    Then, Acanthophis merges per-runlib BAMs to per-sample BAMs, and
+    uses <monospace>samtools markdup</monospace>
+    (<xref alt="Danecek et al., 2021" rid="ref-danecek21_twelveyears" ref-type="bibr">Danecek
+    et al., 2021</xref>;
+    <xref alt="Li et al., 2009" rid="ref-li09_sequencealignment" ref-type="bibr">Li
+    et al., 2009</xref>) to mark duplicate reads. Input reference
+    genomes should be uncompressed FASTA files indexed with
+    <monospace>samtools faidx</monospace>.</p>
+  </sec>
+  <sec id="stage-3-variant-calling">
+    <title>Stage 3: Variant Calling</title>
+    <p>Acanthophis uses <monospace>bcftools mpileup</monospace> and/or
+    <monospace>freebayes</monospace> to call raw variants, using priors
+    and thresholds configurable for each sample set. It then normalises
+    variants with <monospace>bcftools norm</monospace>, splits
+    multi-allelic variants, filters each allele with per-sample set
+    filters, combines filter-passing biallelic sites back into single
+    multi-allelic sites, merges region-level VCFs, indexes, and
+    calculates statistics on these final VCF files. Acanthophis provides
+    two alternative approaches to parallelise variant calling: either a
+    static list of non-overlapping genome windows (supplied in a BED
+    file), or genome bins with approximately equal amounts of data,
+    which are automatically generated using mosdepth
+    (<xref alt="Pedersen &amp; Quinlan, 2018" rid="ref-pedersen18_mosdepthquick" ref-type="bibr">Pedersen
+    &amp; Quinlan, 2018</xref>).</p>
+  </sec>
+  <sec id="stage-4-taxon-profiling">
+    <title>Stage 4: Taxon profiling</title>
+    <p>Acanthophis can create taxonomic profiles of each sample with
+    reference to either public sequence databases (e.g. NCBI’s
+    <monospace>nt</monospace> or <monospace>refseq</monospace>), or
+    user-supplied databases. Acanthophis can utilise any of Kraken 2
+    (<xref alt="Wood et al., 2019" rid="ref-wood19_improved" ref-type="bibr">Wood
+    et al., 2019</xref>), Bracken
+    (<xref alt="Lu et al., 2017" rid="ref-lu17_brackenestimating" ref-type="bibr">Lu
+    et al., 2017</xref>), Kaiju
+    (<xref alt="Menzel et al., 2016" rid="ref-menzel16_fastsensitive" ref-type="bibr">Menzel
+    et al., 2016</xref>), Centrifuge
+    (<xref alt="Kim et al., 2016" rid="ref-kim16_centrifugerapid" ref-type="bibr">Kim
+    et al., 2016</xref>), and Diamond
+    (<xref alt="Buchfink et al., 2021" rid="ref-buchfink21_sensitive" ref-type="bibr">Buchfink
+    et al., 2021</xref>) to create taxonomic profiles for each sample
+    against any number of taxon identification databases; most tools
+    supply pre-computed indices for public databases. Acanthophis can
+    then optionally use taxpasta
+    (<xref alt="Beber et al., 2023" rid="ref-beber23_taxpastataxonomic" ref-type="bibr">Beber
+    et al., 2023</xref>) to merge multiple profiles into a single
+    combined table for easy downstream use.</p>
+  </sec>
+  <sec id="stage-5-de-novo-estimates-of-genetic-dissimilarity">
+    <title>Stage 5: <italic>De novo</italic> Estimates of Genetic
+    Dissimilarity</title>
+    <p>Acanthophis can use either <monospace>kWIP</monospace>
+    (<xref alt="Murray et al., 2017" rid="ref-murray17_kwipkmer" ref-type="bibr">Murray
+    et al., 2017</xref>) or Mash
+    (<xref alt="Ondov et al., 2016" rid="ref-ondov16_mashfast" ref-type="bibr">Ondov
+    et al., 2016</xref>) to estimate genetic distances between samples
+    without alignment to a reference genome. These features first count
+    reads into k-mer sketches, and then calculate pairwise distances
+    among samples.</p>
+  </sec>
+  <sec id="stage-6-reporting-and-statistics">
+    <title>Stage 6: Reporting and Statistics</title>
+    <p>Throughout all pipeline stages, various tools output summaries of
+    their actions and/or outputs. We optionally combine these into
+    unified reports by pipeline stage and sample set using MultiQC
+    (<xref alt="Ewels et al., 2016" rid="ref-ewels16_multiqcsummarize" ref-type="bibr">Ewels
+    et al., 2016</xref>), allowing plotting of raw sequence QC
+    statistics, alignment QC statistics, variant QC statistics, and
+    summarisation of taxonomic identification analyses.</p>
+  </sec>
+</sec>
+<sec id="acknowledgements">
+  <title>Acknowledgements</title>
+  <p>We thank Brice Letcher, George Bouras, Abhishek Tiwari, Luisa
+  Teasdale, Anne-Cecile Colin, Rose Andrew, Johannes Köster, and Scott
+  Ferguson for comments or advice on Acanthophis and/or on this
+  manuscript. KDM is supported by a Marie Skłodowska-Curie Actions
+  fellowship. This project has received funding from the European
+  Research Council (ERC) under the European Union’s Horizon 2020
+  research and innovation program (grant agreement No. 951444-PATHOCOM
+  to DW). This work was supported financially by the Australian Research
+  Council (CE140100008; DP150103591; DE190100326). The research was
+  undertaken with the assistance of resources from the National
+  Computational Infrastructure (NCI), which is supported by the
+  Australian Government.</p>
+</sec>
+</body>
+<back>
+<ref-list>
+  <ref id="ref-ahrens21_genomicconstraints">
+    <element-citation publication-type="webpage">
+      <person-group person-group-type="author">
+        <name><surname>Ahrens</surname><given-names>Collin W.</given-names></name>
+        <name><surname>Murray</surname><given-names>Kevin D.</given-names></name>
+        <name><surname>Mazanec</surname><given-names>Richard A.</given-names></name>
+        <name><surname>Ferguson</surname><given-names>Scott</given-names></name>
+        <name><surname>Bragg</surname><given-names>Jason</given-names></name>
+        <name><surname>Jones</surname><given-names>Ashley</given-names></name>
+        <name><surname>Tissue</surname><given-names>David T.</given-names></name>
+        <name><surname>Byrne</surname><given-names>Margaret</given-names></name>
+        <name><surname>Borevitz</surname><given-names>Justin O.</given-names></name>
+        <name><surname>Rymer</surname><given-names>Paul D.</given-names></name>
+      </person-group>
+      <article-title>Genomic constraints to drought adaptation</article-title>
+      <year iso-8601-date="2021-08-08">2021</year><month>08</month><day>08</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2023-10-09">2023</year><month>10</month><day>09</day></date-in-citation>
+      <uri>https://www.biorxiv.org/content/10.1101/2021.08.07.455511v1</uri>
+      <pub-id pub-id-type="doi">10.1101/2021.08.07.455511</pub-id>
+      <fpage>2021.08.07.455511</fpage>
+      <lpage></lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-beber23_taxpastataxonomic">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Beber</surname><given-names>Moritz E.</given-names></name>
+        <name><surname>Borry</surname><given-names>Maxime</given-names></name>
+        <name><surname>Stamouli</surname><given-names>Sofia</given-names></name>
+        <name><surname>Yates</surname><given-names>James A. Fellows</given-names></name>
+      </person-group>
+      <article-title>TAXPASTA: TAXonomic Profile Aggregation and STAndardisation</article-title>
+      <source>Journal of Open Source Software</source>
+      <year iso-8601-date="2023-07-11">2023</year><month>07</month><day>11</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2023-10-04">2023</year><month>10</month><day>04</day></date-in-citation>
+      <volume>8</volume>
+      <issue>87</issue>
+      <issn>2475-9066</issn>
+      <uri>https://joss.theoj.org/papers/10.21105/joss.05627</uri>
+      <pub-id pub-id-type="doi">10.21105/joss.05627</pub-id>
+      <fpage>5627</fpage>
+      <lpage></lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-buchfink21_sensitive">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Buchfink</surname><given-names>Benjamin</given-names></name>
+        <name><surname>Reuter</surname><given-names>Klaus</given-names></name>
+        <name><surname>Drost</surname><given-names>Hajk-Georg</given-names></name>
+      </person-group>
+      <article-title>Sensitive protein alignments at tree-of-life scale using DIAMOND</article-title>
+      <source>Nature Methods</source>
+      <publisher-name>Nature Publishing Group</publisher-name>
+      <year iso-8601-date="2021-04">2021</year><month>04</month>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2024-02-01">2024</year><month>02</month><day>01</day></date-in-citation>
+      <volume>18</volume>
+      <issue>4</issue>
+      <issn>1548-7105</issn>
+      <uri>https://www.nature.com/articles/s41592-021-01101-x</uri>
+      <pub-id pub-id-type="doi">10.1038/s41592-021-01101-x</pub-id>
+      <fpage>366</fpage>
+      <lpage>368</lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-danecek21_twelveyears">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Danecek</surname><given-names>Petr</given-names></name>
+        <name><surname>Bonfield</surname><given-names>James K.</given-names></name>
+        <name><surname>Liddle</surname><given-names>Jennifer</given-names></name>
+        <name><surname>Marshall</surname><given-names>John</given-names></name>
+        <name><surname>Ohan</surname><given-names>Valeriu</given-names></name>
+        <name><surname>Pollard</surname><given-names>Martin O.</given-names></name>
+        <name><surname>Whitwham</surname><given-names>Andrew</given-names></name>
+        <name><surname>Keane</surname><given-names>Thomas</given-names></name>
+        <name><surname>McCarthy</surname><given-names>Shane A.</given-names></name>
+        <name><surname>Davies</surname><given-names>Robert M.</given-names></name>
+        <name><surname>Li</surname><given-names>Heng</given-names></name>
+      </person-group>
+      <article-title>Twelve years of SAMtools and BCFtools</article-title>
+      <source>GigaScience</source>
+      <year iso-8601-date="2021-02-16">2021</year><month>02</month><day>16</day>
+      <volume>10</volume>
+      <issue>2</issue>
+      <issn>2047-217X</issn>
+      <pub-id pub-id-type="doi">10.1093/gigascience/giab008</pub-id>
+      <fpage>giab008</fpage>
+      <lpage></lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-ewels16_multiqcsummarize">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Ewels</surname><given-names>Philip</given-names></name>
+        <name><surname>Magnusson</surname><given-names>Måns</given-names></name>
+        <name><surname>Lundin</surname><given-names>Sverker</given-names></name>
+        <name><surname>Käller</surname><given-names>Max</given-names></name>
+      </person-group>
+      <article-title>MultiQC: Summarize analysis results for multiple tools and samples in a single report</article-title>
+      <source>Bioinformatics (Oxford, England)</source>
+      <year iso-8601-date="2016-10-01">2016</year><month>10</month><day>01</day>
+      <volume>32</volume>
+      <issue>19</issue>
+      <issn>1367-4811</issn>
+      <pub-id pub-id-type="doi">10.1093/bioinformatics/btw354</pub-id>
+      <fpage>3047</fpage>
+      <lpage>3048</lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-kim16_centrifugerapid">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Kim</surname><given-names>Daehwan</given-names></name>
+        <name><surname>Song</surname><given-names>Li</given-names></name>
+        <name><surname>Breitwieser</surname><given-names>Florian P.</given-names></name>
+        <name><surname>Salzberg</surname><given-names>Steven L.</given-names></name>
+      </person-group>
+      <article-title>Centrifuge: Rapid and sensitive classification of metagenomic sequences</article-title>
+      <source>Genome Research</source>
+      <publisher-name>Cold Spring Harbor Lab</publisher-name>
+      <year iso-8601-date="2016-10-17">2016</year><month>10</month><day>17</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2023-10-04">2023</year><month>10</month><day>04</day></date-in-citation>
+      <issn>1088-9051</issn>
+      <uri>https://genome.cshlp.org/content/early/2016/11/16/gr.210641.116</uri>
+      <pub-id pub-id-type="doi">10.1101/gr.210641.116</pub-id>
+    </element-citation>
+  </ref>
+  <ref id="ref-koster12_snakemakescalable">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Köster</surname><given-names>Johannes</given-names></name>
+        <name><surname>Rahmann</surname><given-names>Sven</given-names></name>
+      </person-group>
+      <article-title>Snakemake — a scalable bioinformatics workflow engine</article-title>
+      <source>Bioinformatics</source>
+      <year iso-8601-date="2012-01-10">2012</year><month>01</month><day>10</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2016-03-30">2016</year><month>03</month><day>30</day></date-in-citation>
+      <volume>28</volume>
+      <issue>19</issue>
+      <issn>1367-4803</issn>
+      <uri>http://bioinformatics.oxfordjournals.org/content/28/19/2520</uri>
+      <pub-id pub-id-type="doi">10.1093/bioinformatics/bts480</pub-id>
+      <fpage>2520</fpage>
+      <lpage>2522</lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-koster21_snakemakeworkflows">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Köster</surname><given-names>Johannes</given-names></name>
+        <string-name>Micwessolly</string-name>
+        <name><surname>Kuthe</surname><given-names>Elias</given-names></name>
+        <name><surname>De Coster</surname><given-names>Wouter</given-names></name>
+      </person-group>
+      <article-title>Snakemake-workflows/dna-seq-gatk-variant-calling</article-title>
+      <year iso-8601-date="2021-05-02">2021</year><month>05</month><day>02</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2023-10-09">2023</year><month>10</month><day>09</day></date-in-citation>
+      <uri>https://zenodo.org/record/4677629</uri>
+      <pub-id pub-id-type="doi">10.5281/ZENODO.4677629</pub-id>
+    </element-citation>
+  </ref>
+  <ref id="ref-li09_sequencealignment">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Li</surname><given-names>Heng</given-names></name>
+        <name><surname>Handsaker</surname><given-names>Bob</given-names></name>
+        <name><surname>Wysoker</surname><given-names>Alec</given-names></name>
+        <name><surname>Fennell</surname><given-names>Tim</given-names></name>
+        <name><surname>Ruan</surname><given-names>Jue</given-names></name>
+        <name><surname>Homer</surname><given-names>Nils</given-names></name>
+        <name><surname>Marth</surname><given-names>Gabor</given-names></name>
+        <name><surname>Abecasis</surname><given-names>Goncalo</given-names></name>
+        <name><surname>Durbin</surname><given-names>Richard</given-names></name>
+        <string-name>1000 Genome Project Data Processing Subgroup</string-name>
+      </person-group>
+      <article-title>The Sequence Alignment/Map format and SAMtools</article-title>
+      <source>Bioinformatics (Oxford, England)</source>
+      <year iso-8601-date="2009-08-15">2009</year><month>08</month><day>15</day>
+      <volume>25</volume>
+      <issue>16</issue>
+      <issn>1367-4811</issn>
+      <pub-id pub-id-type="doi">10.1093/bioinformatics/btp352</pub-id>
+      <fpage>2078</fpage>
+      <lpage>2079</lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-li13_aligningsequence">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Li</surname><given-names>Heng</given-names></name>
+      </person-group>
+      <article-title>Aligning sequence reads, clone sequences and assembly contigs with BWA-MEM</article-title>
+      <year iso-8601-date="2013-03-16">2013</year><month>03</month><day>16</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2019-01-02">2019</year><month>01</month><day>02</day></date-in-citation>
+      <uri>https://arxiv.org/abs/1303.3997v2</uri>
+      <pub-id pub-id-type="doi">10.48550/arXiv.1303.3997</pub-id>
+    </element-citation>
+  </ref>
+  <ref id="ref-li18_minimap2pairwise">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Li</surname><given-names>Heng</given-names></name>
+      </person-group>
+      <article-title>Minimap2: Pairwise alignment for nucleotide sequences</article-title>
+      <source>Bioinformatics</source>
+      <person-group person-group-type="editor">
+        <name><surname>Birol</surname><given-names>Inanc</given-names></name>
+      </person-group>
+      <year iso-8601-date="2018-09-15">2018</year><month>09</month><day>15</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2023-10-04">2023</year><month>10</month><day>04</day></date-in-citation>
+      <volume>34</volume>
+      <issue>18</issue>
+      <issn>1367-4803</issn>
+      <uri>https://academic.oup.com/bioinformatics/article/34/18/3094/4994778</uri>
+      <pub-id pub-id-type="doi">10.1093/bioinformatics/bty191</pub-id>
+      <fpage>3094</fpage>
+      <lpage>3100</lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-li21_newstrategies">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Li</surname><given-names>Heng</given-names></name>
+      </person-group>
+      <article-title>New strategies to improve Minimap2 alignment accuracy</article-title>
+      <source>Bioinformatics</source>
+      <person-group person-group-type="editor">
+        <name><surname>Alkan</surname><given-names>Can</given-names></name>
+      </person-group>
+      <year iso-8601-date="2021-12-07">2021</year><month>12</month><day>07</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2023-10-04">2023</year><month>10</month><day>04</day></date-in-citation>
+      <volume>37</volume>
+      <issue>23</issue>
+      <issn>1367-4803</issn>
+      <uri>https://academic.oup.com/bioinformatics/article/37/23/4572/6384570</uri>
+      <pub-id pub-id-type="doi">10.1093/bioinformatics/btab705</pub-id>
+      <fpage>4572</fpage>
+      <lpage>4574</lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-lu17_brackenestimating">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Lu</surname><given-names>Jennifer</given-names></name>
+        <name><surname>Breitwieser</surname><given-names>Florian P.</given-names></name>
+        <name><surname>Thielen</surname><given-names>Peter</given-names></name>
+        <name><surname>Salzberg</surname><given-names>Steven L.</given-names></name>
+      </person-group>
+      <article-title>Bracken: Estimating species abundance in metagenomics data</article-title>
+      <source>PeerJ Computer Science</source>
+      <year iso-8601-date="2017-01-02">2017</year><month>01</month><day>02</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2017-08-08">2017</year><month>08</month><day>08</day></date-in-citation>
+      <volume>3</volume>
+      <issn>2376-5992</issn>
+      <uri>https://peerj.com/articles/cs-104</uri>
+      <pub-id pub-id-type="doi">10.7717/peerj-cs.104</pub-id>
+      <fpage>e104</fpage>
+      <lpage></lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-menzel16_fastsensitive">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Menzel</surname><given-names>Peter</given-names></name>
+        <name><surname>Ng</surname><given-names>Kim Lee</given-names></name>
+        <name><surname>Krogh</surname><given-names>Anders</given-names></name>
+      </person-group>
+      <article-title>Fast and sensitive taxonomic classification for metagenomics with Kaiju</article-title>
+      <source>Nature Communications</source>
+      <year iso-8601-date="2016-04-13">2016</year><month>04</month><day>13</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2016-09-27">2016</year><month>09</month><day>27</day></date-in-citation>
+      <volume>7</volume>
+      <issn>2041-1723</issn>
+      <uri>http://www.nature.com/doifinder/10.1038/ncomms11257</uri>
+      <pub-id pub-id-type="doi">10.1038/ncomms11257</pub-id>
+      <fpage>11257</fpage>
+      <lpage></lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-murray17_kwipkmer">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Murray</surname><given-names>Kevin D.</given-names></name>
+        <name><surname>Webers</surname><given-names>Christfried</given-names></name>
+        <name><surname>Ong</surname><given-names>Cheng Soon</given-names></name>
+        <name><surname>Borevitz</surname><given-names>Justin</given-names></name>
+        <name><surname>Warthmann</surname><given-names>Norman</given-names></name>
+      </person-group>
+      <article-title>kWIP: The k-mer weighted inner product, a de novo estimator of genetic similarity</article-title>
+      <source>PLOS Computational Biology</source>
+      <year iso-8601-date="2017-09-05">2017</year><month>09</month><day>05</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2017-09-10">2017</year><month>09</month><day>10</day></date-in-citation>
+      <volume>13</volume>
+      <issue>9</issue>
+      <issn>1553-7358</issn>
+      <uri>http://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1005727</uri>
+      <pub-id pub-id-type="doi">10.1371/journal.pcbi.1005727</pub-id>
+      <fpage>e1005727</fpage>
+      <lpage></lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-murray19_landscapedrivers">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Murray</surname><given-names>Kevin D.</given-names></name>
+        <name><surname>Janes</surname><given-names>Jasmine K</given-names></name>
+        <name><surname>Jones</surname><given-names>Ashley</given-names></name>
+        <name><surname>Bothwell</surname><given-names>Helen M</given-names></name>
+        <name><surname>Andrew</surname><given-names>Rose L</given-names></name>
+        <name><surname>Borevitz</surname><given-names>Justin O</given-names></name>
+      </person-group>
+      <article-title>Landscape drivers of genomic diversity and divergence in woodland Eucalyptus</article-title>
+      <source>Molecular Ecology</source>
+      <year iso-8601-date="2019-12">2019</year><month>12</month>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2020-08-26">2020</year><month>08</month><day>26</day></date-in-citation>
+      <volume>28</volume>
+      <issue>24</issue>
+      <issn>0962-1083</issn>
+      <uri>https://www.ncbi.nlm.nih.gov/pmc/articles/PMC7065176/</uri>
+      <pub-id pub-id-type="doi">10.1111/mec.15287</pub-id>
+      <fpage>5232</fpage>
+      <lpage>5247</lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-ondov16_mashfast">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Ondov</surname><given-names>Brian D.</given-names></name>
+        <name><surname>Treangen</surname><given-names>Todd J.</given-names></name>
+        <name><surname>Melsted</surname><given-names>Páll</given-names></name>
+        <name><surname>Mallonee</surname><given-names>Adam B.</given-names></name>
+        <name><surname>Bergman</surname><given-names>Nicholas H.</given-names></name>
+        <name><surname>Koren</surname><given-names>Sergey</given-names></name>
+        <name><surname>Phillippy</surname><given-names>Adam M.</given-names></name>
+      </person-group>
+      <article-title>Mash: Fast genome and metagenome distance estimation using MinHash</article-title>
+      <source>Genome Biology</source>
+      <year iso-8601-date="2016">2016</year>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2016-08-30">2016</year><month>08</month><day>30</day></date-in-citation>
+      <volume>17</volume>
+      <issn>1474-760X</issn>
+      <uri>http://dx.doi.org/10.1186/s13059-016-0997-x</uri>
+      <pub-id pub-id-type="doi">10.1186/s13059-016-0997-x</pub-id>
+      <fpage>132</fpage>
+      <lpage></lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-pedersen18_mosdepthquick">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Pedersen</surname><given-names>Brent S.</given-names></name>
+        <name><surname>Quinlan</surname><given-names>Aaron R.</given-names></name>
+      </person-group>
+      <article-title>Mosdepth: Quick coverage calculation for genomes and exomes</article-title>
+      <source>Bioinformatics (Oxford, England)</source>
+      <year iso-8601-date="2018-03-01">2018</year><month>03</month><day>01</day>
+      <volume>34</volume>
+      <issue>5</issue>
+      <issn>1367-4811</issn>
+      <pub-id pub-id-type="doi">10.1093/bioinformatics/btx699</pub-id>
+      <fpage>867</fpage>
+      <lpage>868</lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-regalado20_combining">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Regalado</surname><given-names>Julian</given-names></name>
+        <name><surname>Lundberg</surname><given-names>Derek S.</given-names></name>
+        <name><surname>Deusch</surname><given-names>Oliver</given-names></name>
+        <name><surname>Kersten</surname><given-names>Sonja</given-names></name>
+        <name><surname>Karasov</surname><given-names>Talia</given-names></name>
+        <name><surname>Poersch</surname><given-names>Karin</given-names></name>
+        <name><surname>Shirsekar</surname><given-names>Gautam</given-names></name>
+        <name><surname>Weigel</surname><given-names>Detlef</given-names></name>
+      </person-group>
+      <article-title>Combining whole-genome shotgun sequencing and rRNA gene amplicon analyses to improve detection of microbe–microbe interaction networks in plant leaves</article-title>
+      <source>The ISME Journal</source>
+      <publisher-name>Nature Publishing Group</publisher-name>
+      <year iso-8601-date="2020-08">2020</year><month>08</month>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2023-05-29">2023</year><month>05</month><day>29</day></date-in-citation>
+      <volume>14</volume>
+      <issue>8</issue>
+      <issn>1751-7370</issn>
+      <uri>https://www.nature.com/articles/s41396-020-0665-8</uri>
+      <pub-id pub-id-type="doi">10.1038/s41396-020-0665-8</pub-id>
+      <fpage>2116</fpage>
+      <lpage>2130</lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-schubert16_adapterremoval">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Schubert</surname><given-names>Mikkel</given-names></name>
+        <name><surname>Lindgreen</surname><given-names>Stinus</given-names></name>
+        <name><surname>Orlando</surname><given-names>Ludovic</given-names></name>
+      </person-group>
+      <article-title>AdapterRemoval v2: Rapid adapter trimming, identification, and read merging</article-title>
+      <source>BMC Research Notes</source>
+      <year iso-8601-date="2016">2016</year>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2016-06-07">2016</year><month>06</month><day>07</day></date-in-citation>
+      <volume>9</volume>
+      <issn>1756-0500</issn>
+      <uri>http://dx.doi.org/10.1186/s13104-016-1900-2</uri>
+      <pub-id pub-id-type="doi">10.1186/s13104-016-1900-2</pub-id>
+      <fpage>88</fpage>
+      <lpage></lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-sedlazeck13_nextgenmapfast">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Sedlazeck</surname><given-names>Fritz J.</given-names></name>
+        <name><surname>Rescheneder</surname><given-names>Philipp</given-names></name>
+        <name><surname>Von Haeseler</surname><given-names>Arndt</given-names></name>
+      </person-group>
+      <article-title>NextGenMap: Fast and accurate read mapping in highly polymorphic genomes</article-title>
+      <source>Bioinformatics</source>
+      <year iso-8601-date="2013-11-01">2013</year><month>11</month><day>01</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2023-10-04">2023</year><month>10</month><day>04</day></date-in-citation>
+      <volume>29</volume>
+      <issue>21</issue>
+      <issn>1367-4803</issn>
+      <uri>https://academic.oup.com/bioinformatics/article/29/21/2790/195626</uri>
+      <pub-id pub-id-type="doi">10.1093/bioinformatics/btt468</pub-id>
+      <fpage>2790</fpage>
+      <lpage>2791</lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-wood19_improved">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Wood</surname><given-names>Derrick E.</given-names></name>
+        <name><surname>Lu</surname><given-names>Jennifer</given-names></name>
+        <name><surname>Langmead</surname><given-names>Ben</given-names></name>
+      </person-group>
+      <article-title>Improved metagenomic analysis with Kraken 2</article-title>
+      <source>Genome Biology</source>
+      <publisher-name>BioMed Central</publisher-name>
+      <year iso-8601-date="2019-12">2019</year><month>12</month>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2023-10-09">2023</year><month>10</month><day>09</day></date-in-citation>
+      <volume>20</volume>
+      <issue>1</issue>
+      <issn>1474-760X</issn>
+      <uri>https://genomebiology.biomedcentral.com/articles/10.1186/s13059-019-1891-0</uri>
+      <pub-id pub-id-type="doi">10.1186/s13059-019-1891-0</pub-id>
+      <fpage>1</fpage>
+      <lpage>13</lpage>
+    </element-citation>
+  </ref>
+  <ref id="ref-yates23_nfcore">
+    <element-citation publication-type="article-journal">
+      <person-group person-group-type="author">
+        <name><surname>Yates</surname><given-names>James A. Fellows</given-names></name>
+        <name><surname>Stamouli</surname><given-names>Sofia</given-names></name>
+        <name><surname>Andersson-Li</surname><given-names>Lili</given-names></name>
+        <name><surname>Beber</surname><given-names>Moritz E.</given-names></name>
+        <name><surname>Mesilaakso</surname><given-names>Lauri</given-names></name>
+        <string-name>Nf-Core Bot</string-name>
+        <name><surname>Christensen</surname><given-names>Thomas A.</given-names></name>
+        <string-name>Mahwash Jamy</string-name>
+        <string-name>JIANHONG OU</string-name>
+        <name><surname>Stepien</surname><given-names>Rafal</given-names></name>
+        <name><surname>Borry</surname><given-names>Maxime</given-names></name>
+        <string-name>Husen M. Umer</string-name>
+        <name><surname>Syme</surname><given-names>Robert</given-names></name>
+        <name><surname>Hübner</surname><given-names>Alex</given-names></name>
+        <string-name>Zandra Fagernäs</string-name>
+      </person-group>
+      <article-title>Nf-core/taxprofiler</article-title>
+      <year iso-8601-date="2023-09-19">2023</year><month>09</month><day>19</day>
+      <date-in-citation content-type="access-date"><year iso-8601-date="2023-10-09">2023</year><month>10</month><day>09</day></date-in-citation>
+      <uri>https://zenodo.org/record/7728364</uri>
+      <pub-id pub-id-type="doi">10.5281/ZENODO.7728364</pub-id>
+    </element-citation>
+  </ref>
+</ref-list>
+</back>
+</article>
diff --git a/joss.06062/10.21105.joss.06062.pdf b/joss.06062/10.21105.joss.06062.pdf
new file mode 100644
index 0000000000..09fb2071de
Binary files /dev/null and b/joss.06062/10.21105.joss.06062.pdf differ