# HG changeset patch
# User nml
# Date 1757703040 0
# Node ID a91455432cd4358207285b9eeee082d300e82e56
# Parent d4a96287909e55e0779bd38ae4571302860dbd7e
planemo upload for repository https://github.com/phac-nml/CryptoGenotyper commit fdca1f95a5d09edf00bddd42286b68fcb20fa981
diff -r d4a96287909e -r a91455432cd4 cryptogenotyper.xml
--- a/cryptogenotyper.xml Fri Oct 16 22:32:56 2020 +0000
+++ b/cryptogenotyper.xml Fri Sep 12 18:50:40 2025 +0000
@@ -3,7 +3,7 @@
classifies Cryptosporidium species subtypes based on SSU rRNA and gp60 gene markers from Sanger sequencing data.
- 1.0
+ 1.5.0
cryptogenotyper
@@ -15,20 +15,23 @@
#set $ref_file=''
#if $db
- ln -s '${db}' '${db.name}' &&
+ ln -sf '${db}' '${db.name}' &&
#set $ref_file = $db.name
#end if
#if $primers['seqtype'] == 'contig'
- ln -s '${$primers.abi_input['forward']}' '${primers.abi_input.name}_forward.ab1' &&
- ln -s '${$primers.abi_input['reverse']}' '${primers.abi_input.name}_reverse.ab1' &&
+ #set $forward_name=$primers.input.forward.name.rsplit('.', 1)[0]
+ #set $reverse_name=$primers.input.reverse.name.rsplit('.', 1)[0]
+ ln -sf '${$primers.input['forward']}' '${forward_name}_forward.${primers.input.forward.ext}' &&
+ ln -sf '${$primers.input['reverse']}' '${reverse_name}_reverse.${primers.input.reverse.ext}' &&
cryptogenotyper -i '.' -m '$marker' -t '$primers.seqtype' -f 'forward' -r 'reverse'
#if $db
--databasefile $ref_file
#end if
#else
- ln -s '${primers.abi_input}' '${primers.abi_input.element_identifier}' &&
- cryptogenotyper -i './${primers.abi_input.element_identifier}' -m '$marker' -t '$primers.seqtype'
+ #set $filename_no_ext=$primers.input.name.rsplit('.', 1)[0]
+ ln -sf '${primers.input}' '${filename_no_ext}.${primers.input.ext}' &&
+ cryptogenotyper -i './${primers.input.name}' -m '$marker' -t '$primers.seqtype'
#if $db
--databasefile $ref_file
#end if
@@ -39,57 +42,236 @@
-
+
-
+
-
+
-
+
-
+
-
+
+
-
-
+
+
+ primers['seqtype'] != 'contig'
+
+
+
+ primers['seqtype'] == 'contig'
+
+
+
+
+ primers['seqtype'] != 'contig'
+
+
+
+ primers['seqtype'] == 'contig'
+
+
+
+
+ show_log and primers['seqtype'] != 'contig'
+
+
+
+ show_log and primers['seqtype'] == 'contig'
+
+
-
-
-
+
+
+
+
+
+
+
+
+
-
-
-
-
-
-
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
@@ -98,30 +280,56 @@
**Syntax**
-CryptoGenotyper is a standalone tool to *in-silico* determine species and subtype based on SSU rRNA and gp60 markers.
-For more information please visit https://github.com/phac-nml/CryptoGenotyper.
+CryptoGenotyper is a standalone tool to *in-silico* determine species and subtype based on SSU rRNA (18S) and gp60 markers.
+
+**❗ Important:** To process **multiple input files** and generate **a single** combined report, please import and use the workflows available `here`_.
+
+.. _here: https://github.com/phac-nml/CryptoGenotyper/tree/main/CryptoGenotyper/GalaxyWorkflows
+
+
+For a tutorial on how to use CryptoGenotyper, please refer to the `official tutorial`_.
+
+For more information, please visit https://github.com/phac-nml/CryptoGenotyper.
+
+.. _official tutorial: https://github.com/phac-nml/CryptoGenotyper/blob/docs/docs/CryptoGenotyperTutorial-CrownCopyright.pdf
-----
**Input:**
-AB1 file(s) representing *Cryptosporidium's* SSU rRNA or gp60 locus (forward, reverse, or contig (forward and reverse paired-end reads)).
-Optional: A custom reference database in .fa file format, to be used during the homology search for *Cryptosporidium* classification.
+AB1 or FASTA file(s) representing Cryptosporidium's SSU rRNA (18S) or gp60 locus can be provided as single-end reads (either forward or reverse only) or as paired-end reads in contig mode (both a forward and a reverse read for each sample).
+
+Optional: A custom reference database of SSU rRNA or gp60 locus in .fasta file format, to be used during the homology search for *Cryptosporidium* classification.
**Output:**
-FASTA file containing the identification of the *Cryptosporidium* species/subtype and its corresponding sequence for each sample.
+A tabular report and a FASTA file containing the identification of the *Cryptosporidium* species/subtype and its corresponding sequence for each sample along with other relevant details.
+The gp60 subtyping is based on the `Deciphering a cryptic minefield: a guide to Cryptosporidium gp60 subtyping publication`_.
+
+.. _`Deciphering a cryptic minefield: a guide to Cryptosporidium gp60 subtyping publication`: https://doi.org/10.1016/j.crpvbd.2025.100257
+
- @misc{githubCryptoGenotyper,
- author = {Yanta C, Bessonov K, Robinson G, Troell K, Guy R},
+ @ARTICLE{githubCryptoGenotyper,
+ author = {Yanta, Christine A. and Bessonov, Kyrylo and Robinson, Guy and Troell, Karin and Guy, Rebecca A.},
title = {CryptoGenotyper: a new bioinformatics tool to enhance Cryptosporidium identification},
- publisher = {GitHub},
- journal = {GitHub repository},
- url = {https://github.com/phac-nml/CryptoGenotyper}
+ journal = {Food and waterborne parasitology},
+ year = {2021},
+ volume = {23},
+ url = {https://doi.org/10.1016/j.fawpar.2021.e00115}
}
+
+ @ARTICLE{RobinsonGp60,
+ author = {Robinson, Gillian and Chalmers, Rachel M. and Elwin, Kirsty and Guy, Richard A. and Bessonov, Konstantin and Troell, Kristina and Xiao, Lihua},
+ title = {Deciphering a cryptic minefield: A guide to Cryptosporidium gp60 subtyping},
+ journal = {Current Research in Parasitology and Vector-Borne Diseases},
+ year = {2025},
+ volume = {7},
+ url = {https://doi.org/10.1016/j.crpvbd.2025.100257}
+ }
+ }
diff -r d4a96287909e -r a91455432cd4 test-data/test_illumina_18S_F.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_illumina_18S_F.fasta Fri Sep 12 18:50:40 2025 +0000
@@ -0,0 +1,8 @@
+>M04527:274:000000000-DBMY7:1:1102:16042:18930 1:N:0:20
+AGTGACAAGAAATAACAATACAGGACTTTTTGGTTTTGTAATTGGAATGAGTTAAGTATAAACCCCTTTACAAGTATCAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGTTAATAATTTATATAAAATATTTTGATGAATATTTATATAATATTAACATAATTCATATTACTATTTTTTTTTT
+>M04527:274:000000000-DBMY7:1:1101:20679:16373 1:N:0:20
+AGTGACAAGAAATAACAATACAGGACTTTTTGGTTTTGTAATTGGAATGAGTTAAGTATAAACCCCTTTACAAGTATCAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGTTAATAATTTATATAAAATATTTTGATGAATATTTATATAATATTAACATAATTCATATTACTATTTTTTTTTT
+>M04527:274:000000000-DBMY7:1:1102:12557:11653 1:N:0:20
+AGTGACAAGAAATAACAATACAGGACTTTTTGGTTTTGTAATTGGAATGAGTTAAGTATAAACCCCTTTACAAGTATCAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGTTAATAATTTATATAAAATATTTTGATGAATATTTATATAATATTAACATAATTCATATTACTATTTTTTTTAG
+>M04527:274:000000000-DBMY7:1:1102:17887:8992 1:N:0:20
+AGTGACAAGAAATAACAATACAGGACTTTTTGGTTTTGTAATTGGAATGAGTTAAGTATAAACCCCTTTACAAGTATCAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGTTAATAATTTATATAAAATATTTTGATGAATATTTATATAATATTAACATAATTCATATTACTATTTTTTTTTT
diff -r d4a96287909e -r a91455432cd4 test-data/test_illumina_18S_R.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_illumina_18S_R.fasta Fri Sep 12 18:50:40 2025 +0000
@@ -0,0 +1,8 @@
+>M04527:274:000000000-DBMY7:1:1102:16042:18930 1:N:0:20
+AGTGACAAGAAATAACAATACAGGACTTTTTGGTTTTGTAATTGGAATGAGTTAAGTATAAACCCCTTTACAAGTATCAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGTTAATAATTTATATAAAATATTTTGATGAATATTTATATAATATTAACATAATTCATATTACTATTTTTTTTTT
+>M04527:274:000000000-DBMY7:1:1101:20679:16373 1:N:0:20
+AGTGACAAGAAATAACAATACAGGACTTTTTGGTTTTGTAATTGGAATGAGTTAAGTATAAACCCCTTTACAAGTATCAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGTTAATAATTTATATAAAATATTTTGATGAATATTTATATAATATTAACATAATTCATATTACTATTTTTTTTTT
+>M04527:274:000000000-DBMY7:1:1102:12557:11653 1:N:0:20
+AGTGACAAGAAATAACAATACAGGACTTTTTGGTTTTGTAATTGGAATGAGTTAAGTATAAACCCCTTTACAAGTATCAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGTTAATAATTTATATAAAATATTTTGATGAATATTTATATAATATTAACATAATTCATATTACTATTTTTTTTAG
+>M04527:274:000000000-DBMY7:1:1102:17887:8992 1:N:0:20
+AGTGACAAGAAATAACAATACAGGACTTTTTGGTTTTGTAATTGGAATGAGTTAAGTATAAACCCCTTTACAAGTATCAATTGGAGGGCAAGTCTGGTGCCAGCAGCCGCGGTAATTCCAGCTCCAATAGCGTATATTAAAGTTGTTGCAGTTAAAAAGCTCGTAGTTGGATTTCTGTTAATAATTTATATAAAATATTTTGATGAATATTTATATAATATTAACATAATTCATATTACTATTTTTTTTTT
diff -r d4a96287909e -r a91455432cd4 test-data/test_illumina_gp60_F1.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_illumina_gp60_F1.fasta Fri Sep 12 18:50:40 2025 +0000
@@ -0,0 +1,5 @@
+>M04527:274:000000000-DBMY7:1:1102:14324:28396 1:N:0:26
+TCCGCTGTATTCTCAGCCCCAGCCGTTCCACTCAGAGGAACTTTAAAGGATGTTCCTGTTGAGGGCTCATCATCGTCATCGTCATCGTCATCATCATCATCATCATCATCATCATCATCATCAACATCAACCGTCGCACCAGCAAATAAGGCAAGAACTGGAGAAGACGCAGAAGGCAGTCAAGATTCTAGTGGTACTGAAGCTTCTGGTAGCCAGGGTTCTGAAGAGGAAGGTAGTGAAGACGATGGCCA
+>M04527:274:000000000-DBMY7:1:1102:20035:28200 1:N:0:26
+TCCGCTGTATTCTCAGCCCCTGCCGTTCCACTCAGAGGAACTTTAAAGGATGTTCCTGTTGAGGGCTCATCATCGTCATCGTCATCATCATCATCATCATCATCATCATCATCATCAACATCAACATCAACCGTCGCACCAGCAAATAAGGCAAGAACTGGAGAAGACGCAGAAGGCAGTCAAGATTCTAGTGGTACTGAAGCTTCTGGTAGCCAGGGTTCTGAAGAGGAAGGTAGTGAAGACGATGGCCA
+
diff -r d4a96287909e -r a91455432cd4 test-data/test_illumina_gp60_R1.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_illumina_gp60_R1.fasta Fri Sep 12 18:50:40 2025 +0000
@@ -0,0 +1,4 @@
+>M04527:274:000000000-DBMY7:1:1102:14324:28396 2:N:0:26
+CGAACCACATTACAAATGAAGTGCCGCATTCTTCTTTTGGAGTAGCTTCTATGGTTTCGGTAGTTGCGCCTTCACTTTGAGCTGGAGTAGTGGGTTGGGAAGCAGCACTAGTTTGGCCATCGTCTTCACTACCTTCCTCTTCAGAACCCTGGCTACCAGAAGCTTCAGTACCACTAGAATCTTGACTGCCTTCTGCGTCTTCTCCAGTTCTTGCCTTATTTGCTGGTGCGACGGTTGATGTTGATGATGAT
+>M04527:274:000000000-DBMY7:1:1102:20035:28200 2:N:0:26
+CGAACCACATTACAAATGAAGTGCCGCATTCTTCTTTTGGAGTAGCTTCTATGGTTTCGGTAGTTGCGCCTTCACTTTGAGCTGGAGTAGTGGGTTGGGAAGCAGCACTAGTTTGGCCATCGTCTTCACTACCTTCCTCTTCAGAACCCTGGCTACCAGAAGCTTCAGTACCACTAGAATCTTGACTGCCTTCTGCGTCTTCTCCAGTTCTTGCCTTATTTGCTGGTGCGACGGTTGATGTTGATGTTGAT
\ No newline at end of file