Mercurial > repos > yufei-luo > s_mart
annotate smart_toolShed/SMART/Java/Python/modifyFasta.py @ 0:e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
| author | yufei-luo | 
|---|---|
| date | Thu, 17 Jan 2013 10:52:14 -0500 | 
| parents | |
| children | 
| rev | line source | 
|---|---|
| 
0
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
1 #! /usr/bin/env python | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
2 # | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
3 # Copyright INRA-URGI 2009-2010 | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
4 # | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
5 # This software is governed by the CeCILL license under French law and | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
6 # abiding by the rules of distribution of free software. You can use, | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
7 # modify and/ or redistribute the software under the terms of the CeCILL | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
8 # license as circulated by CEA, CNRS and INRIA at the following URL | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
9 # "http://www.cecill.info". | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
10 # | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
11 # As a counterpart to the access to the source code and rights to copy, | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
12 # modify and redistribute granted by the license, users are provided only | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
13 # with a limited warranty and the software's author, the holder of the | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
14 # economic rights, and the successive licensors have only limited | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
15 # liability. | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
16 # | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
17 # In this respect, the user's attention is drawn to the risks associated | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
18 # with loading, using, modifying and/or developing or reproducing the | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
19 # software by the user in light of its specific status of free software, | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
20 # that may mean that it is complicated to manipulate, and that also | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
21 # therefore means that it is reserved for developers and experienced | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
22 # professionals having in-depth computer knowledge. Users are therefore | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
23 # encouraged to load and test the software's suitability as regards their | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
24 # requirements in conditions enabling the security of their systems and/or | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
25 # data to be ensured and, more generally, to use and operate it in the | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
26 # same conditions as regards security. | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
27 # | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
28 # The fact that you are presently reading this means that you have had | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
29 # knowledge of the CeCILL license and that you accept its terms. | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
30 # | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
31 """Modify the content of a FASTA file""" | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
32 | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
33 from optparse import OptionParser | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
34 from commons.core.parsing.FastaParser import FastaParser | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
35 from commons.core.writer.FastaWriter import FastaWriter | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
36 from SMART.Java.Python.misc.Progress import Progress | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
37 | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
38 | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
39 if __name__ == "__main__": | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
40 | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
41 # parse command line | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
42 description = "Modify Sequence List v1.0.1: Extend or shrink a list of sequences. [Category: Data Modification]" | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
43 | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
44 parser = OptionParser(description = description) | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
45 parser.add_option("-i", "--input", dest="inputFileName", action="store", type="string", help="input file [compulsory] [format: file in FASTA format]") | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
46 parser.add_option("-o", "--output", dest="outputFileName", action="store", default=None, type="string", help="output file [compulsory] [format: output file in FASTA format]") | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
47 parser.add_option("-s", "--start", dest="start", action="store", default=None, type="int", help="keep first nucleotides [format: int]") | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
48 parser.add_option("-e", "--end", dest="end", action="store", default=None, type="int", help="keep last nucleotides [format: int]") | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
49 parser.add_option("-v", "--verbosity", dest="verbosity", action="store", default=1, type="int", help="trace level [format: int]") | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
50 (options, args) = parser.parse_args() | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
51 | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
52 parser = FastaParser(options.inputFileName, options.verbosity) | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
53 writer = FastaWriter(options.outputFileName, options.verbosity) | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
54 progress = Progress(parser.getNbSequences(), "Reading file %s" % (options.inputFileName), options.verbosity) | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
55 for sequence in parser.getIterator(): | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
56 if options.start != None: | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
57 sequence.shrinkToFirstNucleotides(options.start) | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
58 if options.end != None: | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
59 sequence.shrinkToLastNucleotides(options.end) | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
60 writer.addSequence(sequence) | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
61 progress.inc() | 
| 
 
e0f8dcca02ed
Uploaded S-MART tool. A toolbox manages RNA-Seq and ChIP-Seq data.
 
yufei-luo 
parents:  
diff
changeset
 | 
62 progress.done() | 
