# HG changeset patch # User iuc # Date 1536332359 14400 # Node ID 518ba4a77274bfcb52606667f4d3dfea5a6ffea4 # Parent 7d8138b4a593279cf6509685e3fb0c3dfd70abc1 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/khmer commit e0cd7ae10ce97bed51594e7cc0b969a803d698b7 diff -r 7d8138b4a593 -r 518ba4a77274 filter-below-abund.py --- a/filter-below-abund.py Sat Jan 21 14:43:04 2017 -0500 +++ b/filter-below-abund.py Fri Sep 07 10:59:19 2018 -0400 @@ -38,11 +38,10 @@ import os import sys -import khmer -from khmer.thread_utils import ThreadedSequenceProcessor, verbose_fasta_iter +import screed +from khmer import Countgraph, ReadParser +from khmer.utils import (broken_paired_reader, write_record) -WORKER_THREADS = 8 -GROUPSIZE = 100 CUTOFF = 50 @@ -51,12 +50,9 @@ infiles = sys.argv[2:] print('file with ht: %s' % counting_ht) - print('-- settings:') - print('N THREADS', WORKER_THREADS) - print('--') print('making hashtable') - ht = khmer.load_countgraph(counting_ht) + ht = Countgraph.load(counting_ht) K = ht.ksize() for infile in infiles: @@ -65,22 +61,18 @@ outfp = open(outfile, 'w') - def process_fn(record, ht=ht): - name = record['name'] - seq = record['sequence'] + paired_iter = broken_paired_reader(ReadParser(infile), min_length=K, + force_single=True) + for n, is_pair, read1, read2 in paired_iter: + name = read1.name + seq = read1.sequence if 'N' in seq: return None, None trim_seq, trim_at = ht.trim_below_abundance(seq, CUTOFF) if trim_at >= K: - return name, trim_seq - - return None, None - - tsp = ThreadedSequenceProcessor(process_fn, WORKER_THREADS, GROUPSIZE) - - tsp.start(verbose_fasta_iter(infile), outfp) + write_record(screed.Record(name=name, sequence=trim_seq), outfp) if __name__ == '__main__': diff -r 7d8138b4a593 -r 518ba4a77274 macros.xml --- a/macros.xml Sat Jan 21 14:43:04 2017 -0500 +++ b/macros.xml Fri Sep 07 10:59:19 2018 -0400 @@ -1,9 +1,7 @@ - 2.0 + 3.0.0a1 - bz2file - screed khmer @@ -47,7 +45,7 @@ - @@ -93,31 +91,7 @@ - @article{khmer2015, - author = "Crusoe, Michael R. and Alameldin, Hussien F. and Awad, Sherine - and Bucher, Elmar and Caldwell, Adam and Cartwright, Reed and Charbonneau, - Amanda and Constantinides, Bede and Edvenson, Greg and Fay, Scott and Fenton, - Jacob and Fenzl, Thomas and Fish, Jordan and Garcia-Gutierrez, Leonor and - Garland, Phillip and Gluck, Jonathan and González, Iván and Guermond, Sarah - and Guo, Jiarong and Gupta, Aditi and Herr, Joshua R. and Howe, Adina and - Hyer, Alex and Härpfer, Andreas and Irber, Luiz and Kidd, Rhys and Lin, David - and Lippi, Justin and Mansour, Tamer and McA'Nulty, Pamela and McDonald, Eric - and Mizzi, Jessica and Murray, Kevin D. and Nahum, Joshua R. and Nanlohy, - Kaben and Nederbragt, Alexander Johan and Ortiz-Zuazaga, Humberto and Ory, - Jeramia and Pell, Jason and Pepe-Ranney, Charles and Russ, Zachary N and - Schwarz, Erich and Scott, Camille and Seaman, Josiah and Sievert, Scott and - Simpson, Jared and Skennerton, Connor T. and Spencer, James and Srinivasan, - Ramakrishnan and Standage, Daniel and Stapleton, James A. and Stein, Joe and - Steinman, Susan R and Taylor, Benjamin and Trimble, Will and Wiencko, Heather - L. and Wright, Michael and Wyss, Brian and Zhang, Qingpeng and zyme, en and - Brown, C. Titus" - title = "The khmer software package: enabling efficient nucleotide - sequence analysis", - year = "2015", - month = "08", - publisher = "F1000", - url = "http://dx.doi.org/10.12688/f1000research.6924.1" - } + 10.12688/f1000research.6924.1 @unpublished{diginorm, @@ -130,19 +104,7 @@ url = "http://arxiv.org/abs/1203.4802", } - @article{Pell2012, - doi = {10.1073/pnas.1121464109}, - url = {http://dx.doi.org/10.1073/pnas.1121464109}, - year = {2012}, - month = {jul}, - publisher = {Proceedings of the National Academy of Sciences}, - volume = {109}, - number = {33}, - pages = {13272--13277}, - author = {J. Pell and A. Hintze and R. Canino-Koning and A. Howe and J. M. Tiedje and C. T. Brown}, - title = {Scaling metagenome sequence assembly with probabilistic de Bruijn graphs}, - journal = {Proceedings of the National Academy of Sciences} - } + 10.1073/pnas.1121464109 10.1371/journal.pone.0101271 diff -r 7d8138b4a593 -r 518ba4a77274 tool_dependencies.xml --- a/tool_dependencies.xml Sat Jan 21 14:43:04 2017 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,12 +0,0 @@ - - - - - - - - - - - -