annotate mrfast-2.1.0.5/CommandLineParser.c @ 1:d4054b05b015 default tip

Version update to 2.1.0.5
author calkan
date Fri, 09 Mar 2012 07:35:51 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
1 /*
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
2 * Copyright (c) <2008 - 2012>, University of Washington, Simon Fraser University
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
3 * All rights reserved.
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
4 *
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
5 * Redistribution and use in source and binary forms, with or without modification,
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
6 * are permitted provided that the following conditions are met:
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
7 *
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
8 * Redistributions of source code must retain the above copyright notice, this list
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
9 * of conditions and the following disclaimer.
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
10 * - Redistributions in binary form must reproduce the above copyright notice, this
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
11 * list of conditions and the following disclaimer in the documentation and/or other
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
12 * materials provided with the distribution.
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
13 * - Neither the names of the University of Washington, Simon Fraser University,
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
14 * nor the names of its contributors may be
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
15 * used to endorse or promote products derived from this software without specific
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
16 * prior written permission.
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
17 *
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
19 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
20 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
21 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
22 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
23 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
24 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
25 * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
26 * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
27 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
28 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
29 */
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
30
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
31 /*
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
32 Authors:
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
33 Farhad Hormozdiari
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
34 Faraz Hach
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
35 Can Alkan
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
36 Emails:
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
37 farhadh AT uw DOT edu
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
38 fhach AT cs DOT sfu DOT ca
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
39 calkan AT uw DOT edu
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
40 */
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
41
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
42
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
43 #include <stdio.h>
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
44 #include <stdlib.h>
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
45 #include <getopt.h>
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
46 #include <string.h>
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
47 #include <ctype.h>
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
48 #include "Common.h"
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
49 #include "CommandLineParser.h"
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
50
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
51 int uniqueMode=1;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
52 int indexingMode;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
53 int searchingMode;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
54 int pairedEndMode;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
55 int pairedEndDiscordantMode;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
56 int transChromosal=0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
57 int pairedEndProfilingMode;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
58 int seqCompressed;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
59 int outCompressed;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
60 int cropSize = 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
61 int progressRep = 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
62 int minPairEndedDistance=-1;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
63 int maxPairEndedDistance=-1;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
64 int minPairEndedDiscordantDistance=-1;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
65 int maxPairEndedDiscordantDistance=-1;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
66 int bestMode;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
67 int nosamMode;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
68 char *seqFile1;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
69 char *seqFile2;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
70 char *mappingOutput = "output";
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
71 char *mappingOutputPath = "";
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
72 char *unmappedOutput = "unmapped";
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
73 char fileName[1000][2][FILE_NAME_LENGTH];
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
74 int fileCnt;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
75 int maxOEAOutput=100;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
76 int maxDiscordantOutput=300;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
77 unsigned char errThreshold=2;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
78 unsigned char maxHits=0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
79 unsigned char WINDOW_SIZE = 12;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
80 unsigned int CONTIG_SIZE;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
81 unsigned int CONTIG_MAX_SIZE;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
82
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
83 void printHelp();
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
84
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
85 int parseCommandLine (int argc, char *argv[])
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
86 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
87
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
88 int o;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
89 int index;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
90 char *fastaFile = NULL;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
91 char *batchFile = NULL ;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
92 int batchMode = 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
93
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
94 static struct option longOptions[] =
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
95 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
96 {"pe", no_argument, &pairedEndMode, 1},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
97 {"discordant-vh", no_argument, &pairedEndDiscordantMode, 1},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
98 {"trans", no_argument, &transChromosal , 1},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
99 {"profile", no_argument, &pairedEndProfilingMode, 1},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
100 {"seqcomp", no_argument, &seqCompressed, 1},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
101 {"outcomp", no_argument, &outCompressed, 1},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
102 {"progress", no_argument, &progressRep, 1},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
103 {"best", no_argument, &bestMode, 1},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
104 {"index", required_argument, 0, 'i'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
105 {"search", required_argument, 0, 's'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
106 {"help", no_argument, 0, 'h'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
107 {"version", no_argument, 0, 'v'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
108 {"seq", required_argument, 0, 'x'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
109 {"seq1", required_argument, 0, 'x'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
110 {"seq2", required_argument, 0, 'y'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
111 {"ws", required_argument, 0, 'w'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
112 {"min", required_argument, 0, 'l'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
113 {"max", required_argument, 0, 'm'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
114 {"crop", required_argument, 0, 'c'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
115 {"maxoea", required_argument, 0, 'a'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
116 {"maxdis", required_argument, 0, 'd'},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
117 {"nosam", no_argument, &nosamMode, 1},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
118 {0, 0, 0, 0},
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
119 };
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
120
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
121 while ( (o = getopt_long ( argc, argv, "bhvn:e:o:u:i:s:x:y:w:l:m:c:a:d:", longOptions, &index)) != -1 )
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
122 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
123 switch (o)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
124 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
125 case 'a':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
126 maxOEAOutput = atoi(optarg);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
127 if (maxOEAOutput == 0)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
128 maxOEAOutput = 100000;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
129 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
130 case 'd':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
131 maxDiscordantOutput = atoi(optarg);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
132 if (maxDiscordantOutput == 0)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
133 maxDiscordantOutput = 100000;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
134 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
135 case 'i':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
136 indexingMode = 1;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
137 fastaFile = optarg;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
138 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
139 case 's':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
140 searchingMode = 1;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
141 fastaFile = optarg;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
142 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
143 case 'b':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
144 batchMode = 1;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
145 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
146 case 'c':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
147 cropSize = atoi(optarg);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
148 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
149 case 'w':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
150 WINDOW_SIZE = atoi(optarg);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
151 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
152 case 'x':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
153 seqFile1 = optarg;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
154 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
155 case 'y':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
156 seqFile2 = optarg;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
157 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
158 case 'u':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
159 unmappedOutput = optarg;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
160 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
161 case 'o':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
162 mappingOutput = getMem(FILE_NAME_LENGTH);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
163 mappingOutputPath = getMem(FILE_NAME_LENGTH);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
164 stripPath (optarg, &mappingOutputPath, &mappingOutput);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
165 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
166 case 'n':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
167 maxHits = atoi(optarg);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
168 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
169 case 'e':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
170 errThreshold = atoi(optarg);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
171 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
172 case 'l':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
173 minPairEndedDistance = atoi(optarg);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
174 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
175 case 'm':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
176 maxPairEndedDistance = atoi(optarg);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
177 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
178 case 'h':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
179 printHelp();
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
180 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
181 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
182 case 'v':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
183 fprintf(stdout, "%s.%s\n", versionNumber, versionNumberF);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
184 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
185 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
186 /* case '?':
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
187 fprintf(stderr, "Unknown parameter: %s\n", longOptions[index].name);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
188 abort();
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
189 break;*/
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
190 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
191
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
192 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
193 if (indexingMode + searchingMode != 1)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
194 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
195 fprintf(stdout, "ERROR: Indexing / Searching mode should be selected\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
196 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
197 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
198
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
199 if (WINDOW_SIZE > 15 || WINDOW_SIZE < 11)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
200 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
201 fprintf(stdout, "ERROR: Window size should be in [12..15]\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
202 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
203 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
204
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
205
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
206 if ( indexingMode )
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
207 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
208 CONTIG_SIZE = 15000000;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
209 CONTIG_MAX_SIZE = 40000000;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
210
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
211 if (batchMode)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
212 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
213 batchFile = fastaFile;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
214 fastaFile = NULL;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
215 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
216
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
217 if (batchFile == NULL && fastaFile == NULL)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
218 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
219 fprintf(stdout, "ERROR: Reference(s) should be indicated for indexing\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
220 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
221 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
222
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
223 if (pairedEndDiscordantMode)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
224 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
225 fprintf(stdout, "ERROR: --discordant-vh cannot be used in indexing mode. \n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
226 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
227 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
228
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
229 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
230
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
231
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
232 if ( searchingMode )
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
233 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
234 CONTIG_SIZE = 300000000;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
235 CONTIG_MAX_SIZE = 300000000;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
236
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
237
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
238 if (batchMode)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
239 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
240 batchFile = fastaFile;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
241 fastaFile = NULL;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
242 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
243
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
244 if (batchFile == NULL && fastaFile == NULL)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
245 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
246 fprintf(stdout, "ERROR: Index File(s) should be indiciated for searching\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
247 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
248 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
249
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
250 if (seqFile1 == NULL && seqFile2 == NULL)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
251 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
252 fprintf(stdout, "ERROR: Please indicate a sequence file for searching.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
253 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
254 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
255
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
256
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
257 if (!pairedEndMode && seqFile2 != NULL)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
258 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
259 fprintf(stdout, "ERROR: Second File can be indicated in pairedend mode\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
260 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
261 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
262
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
263 if (pairedEndMode && (minPairEndedDistance <0 || maxPairEndedDistance < 0 || minPairEndedDistance > maxPairEndedDistance))
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
264 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
265 fprintf(stdout, "ERROR: Please enter a valid range for pairedend sequences.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
266 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
267 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
268
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
269 if (pairedEndMode && seqFile1 == NULL)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
270 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
271 fprintf(stdout, "ERROR: Please indicate the first file for pairedend search.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
272 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
273 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
274
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
275 if (!pairedEndMode && pairedEndDiscordantMode)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
276 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
277 fprintf(stdout, "ERROR: --discordant should be used with --pe");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
278 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
279 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
280
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
281 if (!pairedEndMode && pairedEndProfilingMode)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
282 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
283 fprintf(stdout, "ERROR: --profile should be used with --pe");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
284 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
285 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
286
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
287 if (pairedEndMode)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
288 pairedEndDiscordantMode = 1;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
289 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
290
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
291 int i = 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
292
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
293
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
294 if (batchMode)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
295 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
296 FILE *fp = fileOpen(batchFile, "r");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
297
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
298 if (fp == NULL)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
299 return 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
300
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
301 fileCnt = 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
302
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
303 while ( fgets(fileName[fileCnt][0], FILE_NAME_LENGTH, fp))
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
304 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
305 for (i = strlen(fileName[fileCnt][0])-1; i>=0; i--)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
306 if ( !isspace(fileName[fileCnt][0][i]))
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
307 break;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
308 fileName[fileCnt][0][i+1] = '\0';
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
309
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
310 if (strcmp(fileName[fileCnt][0], "") != 0)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
311 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
312 sprintf(fileName[fileCnt][1], "%s.index", fileName[fileCnt][0]);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
313 fileCnt++;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
314 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
315 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
316 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
317 else
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
318 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
319 sprintf(fileName[fileCnt][0], "%s", fastaFile);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
320 sprintf(fileName[fileCnt][1], "%s.index", fileName[fileCnt][0]);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
321 fileCnt++;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
322 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
323
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
324
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
325 if (pairedEndProfilingMode)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
326 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
327
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
328 minPairEndedDistance = 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
329 maxPairEndedDistance = 300000000;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
330
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
331 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
332
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
333 if (pairedEndDiscordantMode)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
334 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
335 minPairEndedDiscordantDistance = minPairEndedDistance;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
336 maxPairEndedDiscordantDistance = maxPairEndedDistance;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
337
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
338 minPairEndedDistance = 0;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
339 maxPairEndedDistance = 300000000;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
340 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
341
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
342 return 1;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
343 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
344
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
345
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
346 void printHelp()
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
347 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
348 char *errorType;
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
349 if (mrFAST)
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
350 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
351 fprintf(stdout,"mrFAST : Micro-Read Fast Alignment Search Tool.\n\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
352 fprintf(stdout,"Usage: mrfast [options]\n\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
353 errorType="edit distance";
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
354 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
355 else
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
356 {
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
357 fprintf(stdout,"mrsFAST : Micro-Read Substitutions (only) Fast Alignment Search Tool.\n\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
358 fprintf(stdout,"mrsFAST is a cache oblivious read mapping tool. mrsFAST capable of mapping\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
359 fprintf(stdout,"single and paired end reads to the reference genome. Bisulfite treated \n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
360 fprintf(stdout,"sequences are not supported in this version. By default mrsFAST reports \n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
361 fprintf(stdout,"the output in SAM format.\n\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
362 fprintf(stdout,"Usage: mrsFAST [options]\n\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
363 errorType="hamming distance";
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
364 }
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
365
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
366 fprintf(stdout,"General Options:\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
367 fprintf(stdout," -v|--version\t\tCurrent Version.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
368 fprintf(stdout," -h\t\t\tShows the help file.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
369 fprintf(stdout,"\n\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
370
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
371 fprintf(stdout,"Indexing Options:\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
372 fprintf(stdout," --index [file]\t\tGenerate an index from the specified fasta file. \n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
373 fprintf(stdout," -b\t\t\tIndicates the indexing will be done in batch mode.\n\t\t\tThe file specified in --index should contain the \n\t\t\tlist of fasta files.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
374 fprintf(stdout," --ws [int]\t\tSet window size for indexing (default:12 max:14).\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
375 fprintf(stdout,"\n\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
376
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
377 fprintf(stdout,"Searching Options:\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
378 fprintf(stdout," --search [file]\tSearch in the specified genome. Provide the path to the fasta file. \n\t\t\tIndex file should be in the same directory.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
379 fprintf(stdout," -b\t\t\tIndicates the mapping will be done in batch mode. \n\t\t\tThe file specified in --search should contain the \n\t\t\tlist of fasta files.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
380 fprintf(stdout," --pe \t\t\tSearch will be done in Paired-End mode.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
381 fprintf(stdout," --seq [file]\t\tInput sequences in fasta/fastq format [file]. If \n\t\t\tpaired end reads are interleaved, use this option.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
382 fprintf(stdout," --seq1 [file]\t\tInput sequences in fasta/fastq format [file] (First \n\t\t\tfile). Use this option to indicate the first file of \n\t\t\tpaired end reads. \n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
383 fprintf(stdout," --seq2 [file]\t\tInput sequences in fasta/fastq format [file] (Second \n\t\t\tfile). Use this option to indicate the second file of \n\t\t\tpaired end reads. \n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
384 fprintf(stdout," -o [file]\t\tOutput of the mapped sequences. The default is \"output\".\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
385 fprintf(stdout," -u [file]\t\tSave unmapped sequences in fasta/fastq format.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
386 fprintf(stdout," --best \t\tOnly the best mapping from all the possible mapping is returned.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
387 fprintf(stdout," --seqcomp \t\tIndicates that the input sequences are compressed (gz).\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
388 fprintf(stdout," --outcomp \t\tIndicates that output file should be compressed (gz).\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
389 fprintf(stdout," -e [int]\t\tMaximum allowed %s (default 2).\n", errorType);
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
390 fprintf(stdout," --min [int]\t\tMin distance allowed between a pair of end sequences.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
391 fprintf(stdout," --max [int]\t\tMax distance allowed between a pair of end sequences.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
392
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
393 fprintf(stdout," --maxoea [int]\t\tMax number of One End Anchored (OEA) returned for each read pair. We recommend 100 or above for NovelSeq use.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
394 fprintf(stdout," --maxdis [int]\t\tMax number of discordant map locations returned for each read pair. We recommend 300 or above for VariationHunter use.\n");
d4054b05b015 Version update to 2.1.0.5
calkan
parents:
diff changeset
395 }