Mercurial > repos > iuc > qiime_extract_barcodes
comparison generate_test_data.sh @ 0:c7eeac78cb64 draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/qiime/ commit 3b54163c4f7daff76fcc589c4a9057bb03904380
author | iuc |
---|---|
date | Sat, 05 Aug 2017 07:28:39 -0400 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:c7eeac78cb64 |
---|---|
1 #!/usr/bin/env bash | |
2 | |
3 # Data are from test data in https://github.com/biocore/qiime | |
4 | |
5 # align_seqs | |
6 align_seqs.py \ | |
7 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
8 -o 'align_seqs_pynast_uclust' \ | |
9 --alignment_method 'pynast' \ | |
10 --pairwise_alignment_method 'uclust' \ | |
11 --template_fp 'test-data/align_seqs/core_set_aligned.fasta.imputed' \ | |
12 --min_percent_id '0.75' | |
13 | |
14 align_seqs.py \ | |
15 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
16 -o 'align_seqs_pynast_muscle' \ | |
17 --alignment_method 'pynast' \ | |
18 --pairwise_alignment_method 'muscle' \ | |
19 --min_length '50' \ | |
20 --min_percent_id '0.75' | |
21 | |
22 align_seqs.py \ | |
23 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
24 -o 'align_seqs_pynast_pair_hmm' \ | |
25 --alignment_method 'pynast' \ | |
26 --pairwise_alignment_method 'pair_hmm' \ | |
27 --min_percent_id '0.75' | |
28 | |
29 #align_seqs.py \ | |
30 # --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
31 # -o 'align_seqs_pynast_clustal' \ | |
32 # --alignment_method 'pynast' \ | |
33 # --pairwise_alignment_method 'clustal' \ | |
34 # --min_percent_id '0.75' | |
35 | |
36 align_seqs.py \ | |
37 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
38 -o 'align_seqs_pynast_blast' \ | |
39 --alignment_method 'pynast' \ | |
40 --pairwise_alignment_method 'blast' \ | |
41 --min_percent_id '0.75' | |
42 | |
43 align_seqs.py \ | |
44 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
45 -o 'align_seqs_pynast_mafft' \ | |
46 --alignment_method 'pynast' \ | |
47 --pairwise_alignment_method 'mafft' \ | |
48 --min_percent_id '0.75' | |
49 | |
50 #align_seqs.py \ | |
51 # --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
52 # -o 'align_seqs_infernal' \ | |
53 # --alignment_method 'infernal' \ | |
54 # --template_fp 'test-data/align_seqs/seed.16s.reference_model.sto' \ | |
55 # --min_percent_id '0.75' | |
56 | |
57 #align_seqs.py \ | |
58 # --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
59 # -o 'align_seqs_clustalw' \ | |
60 # --alignment_method 'clustalw' \ | |
61 # --min_percent_id '0.75' | |
62 | |
63 align_seqs.py \ | |
64 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
65 -o 'align_seqs_muscle' \ | |
66 --alignment_method 'muscle' \ | |
67 --min_percent_id '0.75' | |
68 | |
69 align_seqs.py \ | |
70 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
71 -o 'align_seqs_mafft' \ | |
72 --alignment_method 'mafft' \ | |
73 --min_percent_id '0.75' | |
74 | |
75 #alpha_rarefaction | |
76 alpha_rarefaction.py \ | |
77 --otu_table_fp "test-data/alpha_rarefaction/otu_table.biom" \ | |
78 --mapping_fp "test-data/alpha_rarefaction/mapping_file.txt" \ | |
79 -o alpha_rarefaction \ | |
80 --num_steps '2' \ | |
81 --tree_fp "test-data/alpha_rarefaction/rep_set.tre" \ | |
82 --min_rare_depth '10' \ | |
83 --max_rare_depth '50' \ | |
84 --retain_intermediate_files | |
85 rm -rf alpha_rarefaction | |
86 | |
87 # assign_taxonomy | |
88 assign_taxonomy.py \ | |
89 --input_fasta_fp 'test-data/assign_taxonomy/uclust_input_seqs.fasta' \ | |
90 --assignment_method 'uclust' \ | |
91 --min_consensus_fraction '0.51' \ | |
92 --similarity '0.9' \ | |
93 --uclust_max_accepts '3' \ | |
94 -o assign_taxonomy_uclust | |
95 ls assign_taxonomy_uclust | |
96 md5sum 'assign_taxonomy_uclust/uclust_input_seqs_tax_assignments.txt' | |
97 rm -rf assign_taxonomy_uclust | |
98 | |
99 assign_taxonomy.py \ | |
100 --input_fasta_fp 'test-data/assign_taxonomy/mothur_repr_set_seqs.fasta' \ | |
101 --id_to_taxonomy_fp 'test-data/assign_taxonomy/mothur_id_to_taxonomy.txt' \ | |
102 --assignment_method 'mothur' \ | |
103 --reference_seqs_fp 'test-data/assign_taxonomy/mothur_ref_seq_set.fna' \ | |
104 --confidence '0.5' \ | |
105 -o assign_taxonomy_mothur | |
106 ls assign_taxonomy_mothur | |
107 md5sum 'assign_taxonomy_mothur/mothur_repr_set_seqs_tax_assignments.txt' | |
108 rm -rf assign_taxonomy_mothur | |
109 | |
110 assign_taxonomy.py \ | |
111 --input_fasta_fp 'test-data/assign_taxonomy/mothur_repr_set_seqs.fasta' \ | |
112 --id_to_taxonomy_fp 'test-data/assign_taxonomy/mothur_id_to_taxonomy.txt' \ | |
113 --assignment_method 'mothur' \ | |
114 --reference_seqs_fp 'test-data/assign_taxonomy/mothur_ref_seq_set.fna' \ | |
115 --blast_e_value '0.001' \ | |
116 -o assign_taxonomy_blast | |
117 ls assign_taxonomy_blast | |
118 md5sum 'assign_taxonomy_blast/mothur_repr_set_seqs_tax_assignments.txt' | |
119 rm -rf assign_taxonomy_blast | |
120 | |
121 #assign_taxonomy.py \ | |
122 # --input_fasta_fp 'test-data/assign_taxonomy/rdp_input_seqs.fasta' \ | |
123 # --id_to_taxonomy_fp 'test-data/assign_taxonomy/rdp_id_to_taxonomy.txt' \ | |
124 # --assignment_method 'rdp' \ | |
125 # --confidence '3' \ | |
126 # -o assign_taxonomy_rdp | |
127 | |
128 #assign_taxonomy.py \ | |
129 # --input_fasta_fp 'test-data/assign_taxonomy/rtax_ref_seq_set.fna' \ | |
130 # --id_to_taxonomy_fp 'test-data/assign_taxonomy/rtax_id_to_taxonomy.txt' \ | |
131 # --assignment_method 'rtax' \ | |
132 # --read_1_seqs_fp 'test-data/assign_taxonomy/read_1.seqs.fna' \ | |
133 # --read_2_seqs_fp 'test-data/assign_taxonomy/read_2.seqs.fna' \ | |
134 # --single_ok \ | |
135 # --no_single_ok_generic \ | |
136 # --read_id_regex "\S+\s+(\S+)" \ | |
137 # --amplicon_id_regex "(\S+)\s+(\S+?)\/" \ | |
138 # --header_id_regex "\S+\s+(\S+?)\/" \ | |
139 # -o assign_taxonomy_rtax | |
140 #ls assign_taxonomy_rtax | |
141 | |
142 assign_taxonomy.py \ | |
143 --input_fasta_fp 'test-data/assign_taxonomy/mothur_ref_seq_set.fna' \ | |
144 --assignment_method 'sortmerna' \ | |
145 --min_consensus_fraction "0.51" \ | |
146 --similarity "0.9" \ | |
147 --sortmerna_e_value "1.0" \ | |
148 --sortmerna_coverage "0.9" \ | |
149 --sortmerna_best_N_alignments "5" \ | |
150 -o assign_taxonomy_sortmerna | |
151 ls assign_taxonomy_sortmerna | |
152 md5sum 'assign_taxonomy_sortmerna/mothur_ref_seq_set_tax_assignments.txt' | |
153 md5sum 'assign_taxonomy_sortmerna/sortmerna_map.blast' | |
154 rm -rf assign_taxonomy_sortmerna | |
155 | |
156 #beta_diversity | |
157 beta_diversity.py \ | |
158 --input_path 'test-data/beta_diversity/otu_table.biom' \ | |
159 -o beta_diversity_1 \ | |
160 --metrics 'unweighted_unifrac,weighted_unifrac' \ | |
161 --tree_path 'test-data/beta_diversity/rep_set.tre' | |
162 md5 'beta_diversity_1/unweighted_unifrac_otu_table.txt' | |
163 md5 'beta_diversity_1/weighted_unifrac_otu_table.txt' | |
164 rm -rf beta_diversity_1 | |
165 | |
166 beta_diversity.py \ | |
167 --input_path 'test-data/beta_diversity/otu_table.biom' \ | |
168 -o beta_diversity_2 \ | |
169 --metrics 'abund_jaccard,binary_chisq,binary_chord,binary_euclidean,binary_hamming,binary_jaccard,binary_lennon,binary_ochiai,binary_pearson,binary_sorensen_dice,bray_curtis,canberra,chisq,chord,euclidean,gower,hellinger,kulczynski,manhattan,morisita_horn,pearson,soergel,spearman_approx,specprof,unifrac_g,unifrac_g_full_tree,unweighted_unifrac,unweighted_unifrac_full_tree,weighted_normalized_unifrac,weighted_unifrac' \ | |
170 --tree_path 'test-data/beta_diversity/rep_set.tre' | |
171 md5 'beta_diversity_2/canberra_otu_table.txt' | |
172 md5 'beta_diversity_2/pearson_otu_table.txt' | |
173 rm -rf beta_diversity_2 | |
174 | |
175 #beta_diversity_through_plots | |
176 beta_diversity_through_plots.py \ | |
177 --otu_table_fp 'test-data/beta_diversity_through_plots/otu_table.biom' \ | |
178 --mapping_fp 'test-data/beta_diversity_through_plots/map.txt' \ | |
179 --output_dir beta_diversity_through_plots \ | |
180 --tree_fp 'test-data/beta_diversity_through_plots/rep_set.tre' \ | |
181 --parallel | |
182 cp beta_diversity_through_plots/unweighted_unifrac_dm.txt 'test-data/beta_diversity_through_plots/' | |
183 cp beta_diversity_through_plots/unweighted_unifrac_pc.txt 'test-data/beta_diversity_through_plots/' | |
184 cp beta_diversity_through_plots/weighted_unifrac_dm.txt 'test-data/beta_diversity_through_plots/' | |
185 cp beta_diversity_through_plots/weighted_unifrac_pc.txt 'test-data/beta_diversity_through_plots/' | |
186 rm -rf beta_diversity_through_plots | |
187 | |
188 # compare_categories | |
189 compare_categories.py \ | |
190 --method 'adonis' \ | |
191 --input_dm 'test-data/compare_categories/unweighted_unifrac_dm.txt' \ | |
192 --mapping_file 'test-data/compare_categories/map.txt' \ | |
193 --categories 'Treatment' \ | |
194 -o compare_categories_1 \ | |
195 --num_permutations '999' | |
196 cp compare_categories_1/adonis_results.txt "test-data/compare_categories/adonis_results.txt" | |
197 rm -rf compare_categories_1 | |
198 | |
199 compare_categories.py \ | |
200 --method 'dbrda' \ | |
201 --input_dm 'test-data/compare_categories/unweighted_unifrac_dm.txt' \ | |
202 --mapping_file 'test-data/compare_categories/map.txt' \ | |
203 --categories 'Treatment' \ | |
204 -o compare_categories_2 \ | |
205 --num_permutations '99' | |
206 cp compare_categories_2/* "test-data/compare_categories/" | |
207 rm -rf compare_categories_2 | |
208 | |
209 # core_diversity_analyses | |
210 core_diversity_analyses.py \ | |
211 --input_biom_fp 'test-data/core_diversity_analyses/otu_table.biom' \ | |
212 -o core_diversity_analyses_1 \ | |
213 --mapping_fp 'test-data/core_diversity_analyses/map.txt' \ | |
214 --sampling_depth 22 \ | |
215 --tree_fp 'test-data/core_diversity_analyses/rep_set.tre' | |
216 cp core_diversity_analyses_1/bdiv_even22/unweighted_unifrac_pc.txt 'test-data/core_diversity_analyses/unweighted_unifrac_pc.txt' | |
217 rm -rf core_diversity_analyses_1 | |
218 | |
219 core_diversity_analyses.py \ | |
220 --input_biom_fp 'test-data/core_diversity_analyses/otu_table.biom' \ | |
221 -o core_diversity_analyses_2 \ | |
222 --mapping_fp 'test-data/core_diversity_analyses/map.txt' \ | |
223 --sampling_depth 22 \ | |
224 --nonphylogenetic_diversity \ | |
225 --suppress_taxa_summary \ | |
226 --suppress_beta_diversity \ | |
227 --suppress_alpha_diversity \ | |
228 --suppress_group_significance | |
229 rm -rf core_diversity_analyses_2 | |
230 | |
231 # extract_barcodes | |
232 extract_barcodes.py \ | |
233 --fastq1 'test-data/extract_barcodes/inseqs.fastq' \ | |
234 --input_type 'barcode_single_end' \ | |
235 -o extract_barcodes_1 \ | |
236 --bc1_len '6' \ | |
237 --rev_comp_bc1 | |
238 rm -rf extract_barcodes_1 | |
239 | |
240 extract_barcodes.py \ | |
241 --fastq1 'test-data/extract_barcodes/inseqs_R1.fastq' \ | |
242 --input_type 'barcode_paired_end' \ | |
243 --fastq2 'test-data/extract_barcodes/inseqs_R2.fastq' \ | |
244 -o extract_barcodes_2 \ | |
245 --bc1_len '6' \ | |
246 --bc2_len '6' | |
247 rm -rf extract_barcodes_2 | |
248 | |
249 extract_barcodes.py \ | |
250 --fastq1 'test-data/extract_barcodes/inseqs_R1.fastq' \ | |
251 --input_type 'barcode_paired_end' \ | |
252 --fastq2 'test-data/extract_barcodes/inseqs_R2.fastq' \ | |
253 -o extract_barcodes_3 \ | |
254 --bc1_len '6' \ | |
255 --bc2_len '6' \ | |
256 --mapping_fp 'test-data/extract_barcodes/mapping_data.txt' \ | |
257 --attempt_read_reorientation \ | |
258 --disable_header_match | |
259 rm -rf extract_barcodes_3 | |
260 | |
261 extract_barcodes.py \ | |
262 --fastq1 'test-data/extract_barcodes/inseqs_R1.fastq' \ | |
263 --input_type 'barcode_paired_stitched' \ | |
264 -o extract_barcodes_4 \ | |
265 --bc1_len '6' \ | |
266 --bc2_len '8' \ | |
267 --rev_comp_bc1 \ | |
268 --rev_comp_bc2 | |
269 rm -rf extract_barcodes_4 | |
270 | |
271 extract_barcodes.py \ | |
272 --fastq1 'test-data/extract_barcodes/inseqs_R1.fastq' \ | |
273 --input_type 'barcode_in_label' \ | |
274 --char_delineator '#' \ | |
275 -o extract_barcodes_5 \ | |
276 --bc1_len '6' | |
277 rm -rf extract_barcodes_5 | |
278 | |
279 # filter_alignment | |
280 filter_alignment.py \ | |
281 --input_fasta_file 'test-data/filter_alignment/alignment.fasta' \ | |
282 -o 'filter_alignment_default' \ | |
283 --allowed_gap_frac '0.999999' \ | |
284 --threshold '3.0' | |
285 | |
286 filter_alignment.py \ | |
287 --input_fasta_file 'test-data/filter_alignment/alignment.fasta' \ | |
288 -o 'filter_alignment_without_mask_filter_and_outliers' \ | |
289 --suppress_lane_mask_filter \ | |
290 --allowed_gap_frac '0.999999' \ | |
291 --remove_outliers \ | |
292 --threshold '3.0' | |
293 | |
294 filter_alignment.py \ | |
295 --input_fasta_file 'test-data/filter_alignment/alignment.fasta' \ | |
296 -o 'filter_alignment_entropy' \ | |
297 --allowed_gap_frac '0.999999' \ | |
298 --threshold '3.0' \ | |
299 --entropy_threshold '0.1' | |
300 | |
301 # filter_fasta | |
302 filter_fasta.py \ | |
303 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
304 --output_fasta_fp 'filter_fasta_otu_map.fasta' \ | |
305 --otu_map 'test-data/filter_fasta/otu_map.txt' | |
306 | |
307 filter_fasta.py \ | |
308 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
309 --output_fasta_fp 'filter_fasta_otu_map_negate.fasta' \ | |
310 --otu_map 'test-data/filter_fasta/otu_map.txt' \ | |
311 --negate | |
312 | |
313 filter_fasta.py \ | |
314 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
315 --output_fasta_fp 'filter_fasta_seq_id.fasta' \ | |
316 --seq_id_fp 'test-data/filter_fasta/seqs_to_keep.txt' | |
317 | |
318 filter_fasta.py \ | |
319 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
320 --output_fasta_fp 'filter_fasta_otu_table.fasta' \ | |
321 --biom_fp 'test-data/filter_fasta/otu_table.biom' | |
322 | |
323 filter_fasta.py \ | |
324 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
325 --output_fasta_fp 'filter_fasta_subject_fasta.fasta' \ | |
326 --subject_fasta_fp 'test-data/filter_fasta/sl_inseqs.fasta' | |
327 | |
328 filter_fasta.py \ | |
329 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
330 --output_fasta_fp 'filter_fasta_seq_id_prefix.fasta' \ | |
331 --seq_id_prefix 'S5' | |
332 | |
333 filter_fasta.py \ | |
334 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
335 --output_fasta_fp 'filter_fasta_sample_id.fasta' \ | |
336 --sample_id_fp 'test-data/filter_fasta/map.txt' | |
337 | |
338 # filter_otus_from_otu_table | |
339 filter_otus_from_otu_table.py \ | |
340 --input_fp 'test-data/filter_otus_from_otu_table/otu_table.biom' \ | |
341 --min_count '2' \ | |
342 --max_count '1000' \ | |
343 --min_samples '5' \ | |
344 --max_samples '350' \ | |
345 --output_fp 'test-data/filter_otus_from_otu_table/filtered_otu_table.biom' | |
346 | |
347 filter_otus_from_otu_table.py \ | |
348 --input_fp 'test-data/filter_otus_from_otu_table/otu_table.biom' \ | |
349 --otu_ids_to_exclude_fp 'test-data/filter_otus_from_otu_table/chimeric_otus.txt' \ | |
350 --output_fp 'test-data/filter_otus_from_otu_table/chimera_filtered_otu_table.biom' | |
351 | |
352 filter_otus_from_otu_table.py \ | |
353 --input_fp 'test-data/filter_otus_from_otu_table/otu_table.biom' \ | |
354 --otu_ids_to_exclude_fp 'test-data/filter_otus_from_otu_table/chimeric_otus.txt' \ | |
355 --negate_ids_to_exclude \ | |
356 --output_fp 'test-data/filter_otus_from_otu_table/chimera_picked_otu_table.biom' | |
357 | |
358 # filter_samples_from_otu_table | |
359 filter_samples_from_otu_table.py \ | |
360 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
361 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
362 --min_count '150' | |
363 biom convert \ | |
364 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
365 -o 'test-data/filter_samples_from_otu_table/abundance_min.biom' \ | |
366 --to-json | |
367 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
368 | |
369 filter_samples_from_otu_table.py \ | |
370 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
371 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
372 --min_count '0' \ | |
373 --max_count '149' | |
374 biom convert \ | |
375 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
376 -o 'test-data/filter_samples_from_otu_table/abundance_max.biom' \ | |
377 --to-json | |
378 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
379 | |
380 filter_samples_from_otu_table.py \ | |
381 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
382 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
383 --mapping_fp 'test-data/filter_samples_from_otu_table/map.txt' \ | |
384 --output_mapping_fp 'test-data/filter_samples_from_otu_table/metadata_positive.txt' \ | |
385 -s 'Treatment:Control' | |
386 biom convert \ | |
387 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
388 -o 'test-data/filter_samples_from_otu_table/metadata_positive.biom' \ | |
389 --to-json | |
390 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
391 | |
392 filter_samples_from_otu_table.py \ | |
393 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
394 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
395 --mapping_fp 'test-data/filter_samples_from_otu_table/map.txt' \ | |
396 -s 'Treatment:*,!Control' | |
397 biom convert \ | |
398 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
399 -o 'test-data/filter_samples_from_otu_table/metadata_negative.biom' \ | |
400 --to-json | |
401 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
402 | |
403 filter_samples_from_otu_table.py \ | |
404 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
405 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
406 --sample_id_fp 'test-data/filter_samples_from_otu_table/ids.txt' | |
407 biom convert \ | |
408 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
409 -o 'test-data/filter_samples_from_otu_table/id_positive.biom' \ | |
410 --to-json | |
411 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
412 | |
413 filter_samples_from_otu_table.py \ | |
414 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
415 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
416 --sample_id_fp 'test-data/filter_samples_from_otu_table/ids.txt' \ | |
417 --negate_sample_id_fp | |
418 biom convert \ | |
419 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
420 -o 'test-data/filter_samples_from_otu_table/id_negative.biom' \ | |
421 --to-json | |
422 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
423 | |
424 # filter_taxa_from_otu_table | |
425 filter_taxa_from_otu_table.py \ | |
426 --input_otu_table_fp 'test-data/filter_taxa_from_otu_table/otu_table.biom' \ | |
427 --output_otu_table_fp 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
428 --positive_taxa 'p__Bacteroidetes,p__Firmicutes' \ | |
429 --metadata_field 'taxonomy' | |
430 biom convert \ | |
431 -i 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
432 -o 'test-data/filter_taxa_from_otu_table/positive_taxa.biom' \ | |
433 --to-json | |
434 rm 'test-data/filter_taxa_from_otu_table/tmp.biom' | |
435 | |
436 filter_taxa_from_otu_table.py \ | |
437 --input_otu_table_fp 'test-data/filter_taxa_from_otu_table/otu_table.biom' \ | |
438 --output_otu_table_fp 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
439 --negative_taxa 'p__Bacteroidetes,p__Firmicutes' \ | |
440 --metadata_field 'taxonomy' | |
441 biom convert \ | |
442 -i 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
443 -o 'test-data/filter_taxa_from_otu_table/negative_taxa.biom' \ | |
444 --to-json | |
445 rm 'test-data/filter_taxa_from_otu_table/tmp.biom' | |
446 | |
447 filter_taxa_from_otu_table.py \ | |
448 --input_otu_table_fp 'test-data/filter_taxa_from_otu_table/otu_table.biom' \ | |
449 --output_otu_table_fp 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
450 --positive_taxa 'p__Firmicutes' \ | |
451 --negative_taxa 'c__Clostridia' \ | |
452 --metadata_field 'taxonomy' | |
453 biom convert \ | |
454 -i 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
455 -o 'test-data/filter_taxa_from_otu_table/positive_negative_taxa.biom' \ | |
456 --to-json | |
457 rm 'test-data/filter_taxa_from_otu_table/tmp.biom' | |
458 | |
459 # jackknifed_beta_diversity | |
460 jackknifed_beta_diversity.py \ | |
461 --otu_table_fp 'test-data/jackknifed_beta_diversity/otu_table.biom' \ | |
462 --mapping_fp 'test-data/jackknifed_beta_diversity/map.txt' \ | |
463 -o jackknifed_beta_diversity \ | |
464 --seqs_per_sample '10' \ | |
465 --tree_fp 'test-data/jackknifed_beta_diversity/rep_set.tre' \ | |
466 --master_tree 'consensus' \ | |
467 --parallel | |
468 rm -rf jackknifed_beta_diversity | |
469 | |
470 # make_emperor | |
471 cp 'test-data/core_diversity_analyses/unweighted_unifrac_pc.txt' 'test-data/make_emperor/unweighted_unifrac_pc.txt' | |
472 cp 'test-data/core_diversity_analyses/map.txt' 'test-data/make_emperor/map.txt' | |
473 cp 'test-data/summarize_taxa/2_L3.txt' 'test-data/make_emperor/2_L3.txt' | |
474 | |
475 make_emperor.py \ | |
476 --input_coords 'test-data/make_emperor/unweighted_unifrac_pc.txt' \ | |
477 -o make_emperor_1 \ | |
478 --map_fp 'test-data/make_emperor/map.txt' \ | |
479 --number_of_axes '10' \ | |
480 --add_unique_columns \ | |
481 --number_of_segments 8 | |
482 rm -rf make_emperor_1 | |
483 | |
484 make_emperor.py \ | |
485 --input_coords 'test-data/make_emperor/unweighted_unifrac_pc.txt' \ | |
486 -o make_emperor_2 \ | |
487 --map_fp 'test-data/make_emperor/map.txt' \ | |
488 --number_of_axes '10' \ | |
489 --add_unique_columns \ | |
490 --number_of_segments 8 \ | |
491 --taxa_fp 'test-data/make_emperor/2_L3.txt' \ | |
492 --n_taxa_to_keep 10 | |
493 rm -rf make_emperor_2 | |
494 | |
495 # make_otu_heatmap | |
496 make_otu_heatmap.py \ | |
497 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
498 --imagetype 'pdf' \ | |
499 --color_scheme "YlGn" \ | |
500 --width "5" \ | |
501 --height "5" \ | |
502 --dpi "200" \ | |
503 --obs_md_category "taxonomy" \ | |
504 --output_fp 'test-data/make_otu_heatmap/basic_heatmap.pdf' | |
505 | |
506 make_otu_heatmap.py \ | |
507 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
508 --imagetype 'png' \ | |
509 --color_scheme "YlGn" \ | |
510 --width "5" \ | |
511 --height "5" \ | |
512 --dpi "200" \ | |
513 --obs_md_category "taxonomy" \ | |
514 --output_fp 'test-data/make_otu_heatmap/basic_heatmap.png' | |
515 | |
516 make_otu_heatmap.py \ | |
517 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
518 --imagetype 'svg' \ | |
519 --color_scheme "YlGn" \ | |
520 --width "5" \ | |
521 --height "5" \ | |
522 --dpi "200" \ | |
523 --obs_md_category "taxonomy" \ | |
524 --output_fp 'test-data/make_otu_heatmap/basic_heatmap.svg' | |
525 | |
526 make_otu_heatmap.py \ | |
527 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
528 --map_fname 'test-data/make_otu_heatmap/mapping_file.txt' \ | |
529 --imagetype 'pdf' \ | |
530 --color_scheme "YlGn" \ | |
531 --width "5" \ | |
532 --height "5" \ | |
533 --dpi "200" \ | |
534 --obs_md_category "taxonomy" \ | |
535 --output_fp 'test-data/make_otu_heatmap/sample_sorted_heatmap.pdf' | |
536 | |
537 make_otu_heatmap.py \ | |
538 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
539 --map_fname 'test-data/make_otu_heatmap/mapping_file.txt' \ | |
540 --otu_tree 'test-data/make_otu_heatmap/rep_set.tre' \ | |
541 --imagetype 'pdf' \ | |
542 --color_scheme "YlGn" \ | |
543 --width "5" \ | |
544 --height "5" \ | |
545 --dpi "200" \ | |
546 --obs_md_category "taxonomy" \ | |
547 --output_fp 'test-data/make_otu_heatmap/sample_otu_sorted_heatmap.pdf' | |
548 | |
549 make_otu_heatmap.py \ | |
550 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
551 --map_fname 'test-data/make_otu_heatmap/mapping_file.txt' \ | |
552 --category "Treatment" \ | |
553 --imagetype 'pdf' \ | |
554 --color_scheme "YlGn" \ | |
555 --width "5" \ | |
556 --height "5" \ | |
557 --dpi "200" \ | |
558 --obs_md_category "taxonomy" \ | |
559 --output_fp 'test-data/make_otu_heatmap/treatment_sample_sorted_heatmap.pdf' | |
560 | |
561 # make_phylogeny | |
562 make_phylogeny.py \ | |
563 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
564 --result_fp 'test-data/make_phylogeny/fasttree_tree_method_default.tre' \ | |
565 --tree_method 'fasttree' \ | |
566 --log_fp 'fasttree_tree_method_default.txt' \ | |
567 --root_method 'tree_method_default' | |
568 | |
569 make_phylogeny.py \ | |
570 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
571 --result_fp 'raxml_v730.tre' \ | |
572 --tree_method 'raxml_v730' \ | |
573 --log_fp 'raxml_v730.txt' \ | |
574 --root_method 'tree_method_default' | |
575 | |
576 make_phylogeny.py \ | |
577 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
578 --result_fp 'test-data/make_phylogeny/muscle.tre' \ | |
579 --tree_method 'muscle' \ | |
580 --log_fp 'muscle.txt' \ | |
581 --root_method 'tree_method_default' | |
582 | |
583 make_phylogeny.py \ | |
584 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
585 --result_fp 'test-data/make_phylogeny/clustalw.tre' \ | |
586 --tree_method 'clustalw' \ | |
587 --log_fp 'clustalw.txt' \ | |
588 --root_method 'tree_method_default' | |
589 | |
590 make_phylogeny.py \ | |
591 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
592 --result_fp 'clearcut.tre' \ | |
593 --tree_method 'clearcut' \ | |
594 --log_fp 'clearcut.txt' \ | |
595 --root_method 'tree_method_default' | |
596 | |
597 make_phylogeny.py \ | |
598 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
599 --result_fp 'test-data/make_phylogeny/fasttree_midpoint.tre' \ | |
600 --tree_method 'fasttree' \ | |
601 --log_fp 'fasttree_midpoint.txt' \ | |
602 --root_method 'midpoint' | |
603 | |
604 # multiple_join_paired_ends | |
605 multiple_join_paired_ends.py \ | |
606 --input_dir 'test-data/multiple_join_paired_ends/without_barcode/' \ | |
607 --output_dir 'test-data/multiple_join_paired_ends/output_without_barcode' \ | |
608 --read1_indicator 'forward_' \ | |
609 --read2_indicator 'reverse_' \ | |
610 --leading_text '' \ | |
611 --trailing_text '' | |
612 | |
613 #multiple_join_paired_ends.py \ | |
614 # --input_dir 'test-data/multiple_join_paired_ends/without_barcode/' \ | |
615 # --output_dir 'multiple_join_paired_ends_without_barcode_parameter_files' \ | |
616 # --parameter_fp 'test-data/multiple_join_paired_ends/qiime_parameters.txt' \ | |
617 # --read1_indicator '_R1_' \ | |
618 # --read2_indicator '_R2_' \ | |
619 # --leading_text '' \ | |
620 # --trailing_text '' | |
621 | |
622 multiple_join_paired_ends.py \ | |
623 --input_dir 'test-data/multiple_join_paired_ends/with_barcode/' \ | |
624 --output_dir 'test-data/multiple_join_paired_ends/output_with_barcode' \ | |
625 --read1_indicator 'forward_' \ | |
626 --read2_indicator 'reverse_' \ | |
627 --match_barcodes \ | |
628 --barcode_indicator 'barcode_' \ | |
629 --leading_text '' \ | |
630 --trailing_text '' | |
631 | |
632 # multiple_split_libraries_fastq | |
633 multiple_split_libraries_fastq.py \ | |
634 --input_dir 'test-data/multiple_split_libraries_fastq/input' \ | |
635 --output_dir 'multiple_split_libraries_fastq' \ | |
636 --demultiplexing_method 'mapping_barcode_files' \ | |
637 --read_indicator 'reads_' \ | |
638 --barcode_indicator 'barcodes_' \ | |
639 --mapping_indicator 'mapping_' \ | |
640 --mapping_extensions 'txt' \ | |
641 --leading_text '' \ | |
642 --trailing_text '' \ | |
643 --sampleid_indicator '.' | |
644 | |
645 multiple_split_libraries_fastq.py \ | |
646 --input_dir 'test-data/multiple_split_libraries_fastq/input' \ | |
647 --output_dir 'multiple_split_libraries_fastq_with_parameter_file' \ | |
648 --demultiplexing_method 'mapping_barcode_files' \ | |
649 --parameter_fp 'test-data/multiple_split_libraries_fastq/qiime_parameters.txt' \ | |
650 --read_indicator 'reads_' \ | |
651 --barcode_indicator 'barcodes_' \ | |
652 --mapping_indicator 'mapping_' \ | |
653 --mapping_extensions 'txt' \ | |
654 --leading_text '' \ | |
655 --trailing_text '' \ | |
656 --sampleid_indicator '.' | |
657 | |
658 # pick_closed_reference_otus | |
659 pick_closed_reference_otus.py \ | |
660 --input_fp 'test-data/pick_closed_reference_otus/seqs.fna' \ | |
661 --output_dir 'pick_closed_reference_otus' \ | |
662 --reference_fp 'test-data/pick_closed_reference_otus/refseqs.fna' \ | |
663 --taxonomy_fp 'test-data/pick_closed_reference_otus/taxa.txt' | |
664 biom convert \ | |
665 -i 'pick_closed_reference_otus/otu_table.biom' \ | |
666 -o 'test-data/pick_closed_reference_otus/basic_otu_table.biom' \ | |
667 --to-json | |
668 | |
669 pick_closed_reference_otus.py \ | |
670 --input_fp 'test-data/pick_closed_reference_otus/seqs.fna' \ | |
671 --output_dir 'pick_closed_reference_otus_sortmerna' \ | |
672 --reference_fp 'test-data/pick_closed_reference_otus/refseqs.fna' \ | |
673 --taxonomy_fp 'test-data/pick_closed_reference_otus/taxa.txt' \ | |
674 --parameter_fp 'test-data/pick_closed_reference_otus/sortmerna_params.txt' | |
675 biom convert \ | |
676 -i 'pick_closed_reference_otus_sortmerna/otu_table.biom' \ | |
677 -o 'test-data/pick_closed_reference_otus/sortmerna_otu_table.biom' \ | |
678 --to-json | |
679 | |
680 pick_closed_reference_otus.py \ | |
681 --input_fp 'test-data/pick_closed_reference_otus/seqs.fna' \ | |
682 --output_dir 'pick_closed_reference_otus_assign_taxonomy' \ | |
683 --reference_fp 'test-data/pick_closed_reference_otus/refseqs.fna' \ | |
684 --assign_taxonomy | |
685 biom convert \ | |
686 -i 'pick_closed_reference_otus_assign_taxonomy/otu_table.biom' \ | |
687 -o 'test-data/pick_closed_reference_otus/assign_taxonomy_otu_table.biom' \ | |
688 --to-json | |
689 | |
690 pick_closed_reference_otus.py \ | |
691 --input_fp 'test-data/pick_closed_reference_otus/seqs.fna' \ | |
692 --output_dir 'pick_closed_reference_otus_suppress_taxonomy_assignment' \ | |
693 --reference_fp 'test-data/pick_closed_reference_otus/refseqs.fna' \ | |
694 --suppress_taxonomy_assignment | |
695 biom convert \ | |
696 -i 'pick_closed_reference_otus_suppress_taxonomy_assignment/otu_table.biom' \ | |
697 -o 'test-data/pick_closed_reference_otus/suppress_taxonomy_assignment_otu_table.biom' \ | |
698 --to-json | |
699 | |
700 # pick_open_reference_otus | |
701 pick_open_reference_otus.py \ | |
702 --input_fps 'test-data/pick_open_reference_otus/sequences.fasta' \ | |
703 -o pick_open_reference_otus_1 \ | |
704 --reference_fp 'test-data/gg_13_8_79_otus.fasta' \ | |
705 --otu_picking_method 'uclust' \ | |
706 --new_ref_set_id 'New' \ | |
707 --parallel \ | |
708 --percent_subsample '0.001' \ | |
709 --prefilter_percent_id '0.0' \ | |
710 --minimum_failure_threshold '100000' \ | |
711 --min_otu_size '2' | |
712 cp pick_open_reference_otus_1/final_otu_map.txt 'test-data/pick_open_reference_otus/1_final_otu_map.txt' | |
713 cp pick_open_reference_otus_1/final_otu_map_mc*.txt 'test-data/pick_open_reference_otus/1_final_otu_map_mc.txt' | |
714 cp pick_open_reference_otus_1/rep_set.tre 'test-data/pick_open_reference_otus/1_rep_set_tree.tre' | |
715 rm -rf pick_open_reference_otus_1 | |
716 | |
717 pick_open_reference_otus.py \ | |
718 --input_fps 'test-data/pick_open_reference_otus/sequences.fasta' \ | |
719 -o pick_open_reference_otus_2 \ | |
720 --reference_fp 'test-data/gg_13_8_79_otus.fasta' \ | |
721 --otu_picking_method 'uclust' \ | |
722 --new_ref_set_id 'New' \ | |
723 --parallel \ | |
724 --percent_subsample '0.001' \ | |
725 --prefilter_percent_id '0.0' \ | |
726 --minimum_failure_threshold '100000' \ | |
727 --min_otu_size '3' \ | |
728 --suppress_taxonomy_assignment \ | |
729 --suppress_align_and_tree | |
730 cp pick_open_reference_otus_2/final_otu_map.txt 'test-data/pick_open_reference_otus/2_final_otu_map.txt' | |
731 cp pick_open_reference_otus_2/final_otu_map_mc*.txt 'test-data/pick_open_reference_otus/2_final_otu_map_mc.txt' | |
732 rm -rf pick_open_reference_otus_2 | |
733 | |
734 pick_open_reference_otus.py \ | |
735 --input_fps 'test-data/pick_open_reference_otus/sequences.fasta' \ | |
736 -o pick_open_reference_otus_3 \ | |
737 --reference_fp 'test-data/gg_13_8_79_otus.fasta' \ | |
738 --otu_picking_method 'uclust' \ | |
739 --new_ref_set_id 'New' \ | |
740 --parallel \ | |
741 --percent_subsample '0.001' \ | |
742 --prefilter_percent_id '0.0' \ | |
743 --minimum_failure_threshold '100000' \ | |
744 --min_otu_size '10' \ | |
745 --suppress_taxonomy_assignment | |
746 cp pick_open_reference_otus_3/final_otu_map.txt 'test-data/pick_open_reference_otus/3_final_otu_map.txt' | |
747 cp pick_open_reference_otus_3/final_otu_map_mc*.txt 'test-data/pick_open_reference_otus/3_final_otu_map_mc.txt' | |
748 cp pick_open_reference_otus_3/rep_set.tre 'test-data/pick_open_reference_otus/3_rep_set_tree.tre' | |
749 rm -rf pick_open_reference_otus_3 | |
750 | |
751 # pick_otus | |
752 pick_otus.py \ | |
753 -i 'test-data/pick_otus/seqs.fna' \ | |
754 -o 'pick_otus_uclust' \ | |
755 --otu_picking_method 'uclust' \ | |
756 --similarity "0.97" \ | |
757 --denovo_otu_id_prefix "denovo" \ | |
758 --max_accepts "1" \ | |
759 --max_rejects "8" \ | |
760 --stepwords "8" \ | |
761 --word_length "8" \ | |
762 --non_chimeras_retention "union" | |
763 | |
764 pick_otus.py \ | |
765 -i 'test-data/pick_otus/seqs.fna' \ | |
766 -o 'pick_otus_sortmerna' \ | |
767 --otu_picking_method "sortmerna" \ | |
768 --refseqs_fp "test-data/pick_otus/refseqs.fasta" \ | |
769 --sortmerna_e_value "1" \ | |
770 --sortmerna_coverage "0.97" \ | |
771 --sortmerna_tabular \ | |
772 --sortmerna_best_N_alignments "1" \ | |
773 --sortmerna_max_pos "10000" \ | |
774 --similarity "0.97" \ | |
775 --non_chimeras_retention "union" | |
776 | |
777 #pick_otus.py \ | |
778 # -i 'test-data/pick_otus/seqs.fna' \ | |
779 # -o 'pick_otus_mothur' \ | |
780 # --otu_picking_method "mothur" \ | |
781 # --clustering_algorithm "furthest" \ | |
782 # --non_chimeras_retention "union" | |
783 | |
784 pick_otus.py \ | |
785 -i 'test-data/pick_otus/seqs.fna' \ | |
786 -o 'pick_otus_trie' \ | |
787 --otu_picking_method "trie" \ | |
788 --non_chimeras_retention "union" | |
789 | |
790 pick_otus.py \ | |
791 -i 'test-data/pick_otus/seqs.fna' \ | |
792 -o 'pick_otus_uclust_ref' \ | |
793 --otu_picking_method "uclust_ref" \ | |
794 --refseqs_fp "test-data/pick_otus/refseqs.fasta" \ | |
795 --similarity "0.97" \ | |
796 --max_accepts "1" \ | |
797 --max_rejects "8" \ | |
798 --stepwords "8" \ | |
799 --word_length "8" \ | |
800 --non_chimeras_retention "union" | |
801 | |
802 #pick_otus.py \ | |
803 # -i 'test-data/pick_otus/seqs.fna' \ | |
804 # -o 'pick_otus_blast' \ | |
805 # --otu_picking_method "blast" \ | |
806 # --refseqs_fp "test-data/pick_otus/refseqs.fasta" \ | |
807 # --similarity "0.97" \ | |
808 # --max_e_value_blast "1e-10" \ | |
809 # --min_aligned_percent "0.5" \ | |
810 # --non_chimeras_retention "union" | |
811 | |
812 # pick_otus.py \ | |
813 # -i 'test-data/pick_otus/seqs.fna' \ | |
814 # -o 'pick_otus_sumaclust' \ | |
815 # --otu_picking_method "sumaclust" \ | |
816 # --similarity "0.97" \ | |
817 # --sumaclust_l \ | |
818 # --denovo_otu_id_prefix "denovo" \ | |
819 # --non_chimeras_retention "union" | |
820 | |
821 pick_otus.py \ | |
822 -i 'test-data/pick_otus/seqs.fna' \ | |
823 -o 'pick_otus_swarm' \ | |
824 --otu_picking_method "swarm" \ | |
825 --denovo_otu_id_prefix "denovo" \ | |
826 --swarm_resolution "1" \ | |
827 --non_chimeras_retention "union" | |
828 | |
829 pick_otus.py \ | |
830 -i 'test-data/pick_otus/seqs.fna' \ | |
831 -o 'pick_otus_prefix_suffix' \ | |
832 --otu_picking_method "prefix_suffix" \ | |
833 --prefix_length "50" \ | |
834 --suffix_length "50" \ | |
835 --non_chimeras_retention "union" | |
836 | |
837 pick_otus.py \ | |
838 -i 'test-data/pick_otus/seqs.fna' \ | |
839 -o 'pick_otus_cdhit' \ | |
840 --otu_picking_method "cdhit" \ | |
841 --similarity "0.97" \ | |
842 --non_chimeras_retention "union" | |
843 | |
844 pick_otus.py \ | |
845 -i 'test-data/pick_otus/seqs.fna' \ | |
846 -o 'pick_otus_uclust_intersection' \ | |
847 --otu_picking_method "uclust" \ | |
848 --similarity "0.97" \ | |
849 --denovo_otu_id_prefix "denovo" \ | |
850 --max_accepts "1" \ | |
851 --max_rejects "8" \ | |
852 --stepwords "8" \ | |
853 --word_length "8" \ | |
854 --non_chimeras_retention "intersection" | |
855 | |
856 # pick_rep_set | |
857 pick_rep_set.py \ | |
858 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
859 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
860 --rep_set_picking_method 'first' \ | |
861 --sort_by 'otu' \ | |
862 --result_fp 'test-data/pick_rep_set/first_otu_fasta.fasta' \ | |
863 --log_fp 'test-data/pick_rep_set/first_otu_fasta.txt' | |
864 | |
865 pick_rep_set.py \ | |
866 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
867 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
868 --reference_seqs_fp 'test-data/pick_rep_set/refseqs.fasta' \ | |
869 --rep_set_picking_method 'first' \ | |
870 --sort_by 'otu' \ | |
871 --result_fp 'test-data/pick_rep_set/first_otu_fasta_ref.fasta' \ | |
872 --log_fp 'test-data/pick_rep_set/first_otu_fasta_ref.txt' | |
873 | |
874 pick_rep_set.py \ | |
875 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
876 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
877 --rep_set_picking_method 'longest' \ | |
878 --sort_by 'otu' \ | |
879 --result_fp 'test-data/pick_rep_set/longest_otu_fasta.fasta' \ | |
880 --log_fp 'test-data/pick_rep_set/longest_otu_fasta.txt' | |
881 | |
882 pick_rep_set.py \ | |
883 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
884 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
885 --rep_set_picking_method 'most_abundant' \ | |
886 --sort_by 'otu' \ | |
887 --result_fp 'test-data/pick_rep_set/most_abundant_otu_fasta.fasta' \ | |
888 --log_fp 'test-data/pick_rep_set/most_abundant_otu_fasta.txt' | |
889 | |
890 pick_rep_set.py \ | |
891 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
892 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
893 --rep_set_picking_method 'random' \ | |
894 --sort_by 'otu' \ | |
895 --result_fp 'test-data/pick_rep_set/random_otu_fasta.fasta' \ | |
896 --log_fp 'test-data/pick_rep_set/random_otu_fasta.txt' | |
897 | |
898 pick_rep_set.py \ | |
899 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
900 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
901 --rep_set_picking_method 'first' \ | |
902 --sort_by 'seq_id' \ | |
903 --result_fp 'test-data/pick_rep_set/first_seq_id_fasta.fasta' \ | |
904 --log_fp 'test-data/pick_rep_set/first_seq_id_fasta.txt' | |
905 | |
906 # plot_taxa_summary | |
907 plot_taxa_summary.py \ | |
908 --counts_fname 'test-data/plot_taxa_summary/phylum.txt' \ | |
909 --dir_path 'test-data/plot_taxa_summary/phylum' \ | |
910 --labels 'phylum' \ | |
911 --num_categories '20' \ | |
912 --background_color 'white' \ | |
913 --dpi '80' \ | |
914 --x_width '12' \ | |
915 --y_height '12' \ | |
916 --bar_width '0.75' \ | |
917 --type_of_file 'png' \ | |
918 --chart_type 'area,bar,pie' \ | |
919 --resize_nth_label '0' \ | |
920 --label_type 'categorical' | |
921 | |
922 plot_taxa_summary.py \ | |
923 --counts_fname 'test-data/plot_taxa_summary/phylum.txt,test-data/plot_taxa_summary/class.txt,test-data/plot_taxa_summary/genus.txt' \ | |
924 --dir_path 'test-data/plot_taxa_summary/phylum_class_genus' \ | |
925 --labels 'Phylum,Class,Genus' \ | |
926 --num_categories '20' \ | |
927 --background_color 'white' \ | |
928 --dpi '80' \ | |
929 --x_width '12' \ | |
930 --y_height '12' \ | |
931 --bar_width '0.75' \ | |
932 --type_of_file 'png' \ | |
933 --chart_type 'area,bar,pie' \ | |
934 --resize_nth_label '0' \ | |
935 --label_type 'categorical' | |
936 | |
937 plot_taxa_summary.py \ | |
938 --counts_fname 'test-data/plot_taxa_summary/class.txt' \ | |
939 --dir_path 'test-data/plot_taxa_summary/class' \ | |
940 --labels 'Class' \ | |
941 --num_categories '10' \ | |
942 --background_color 'white' \ | |
943 --dpi '80' \ | |
944 --x_width '12' \ | |
945 --y_height '12' \ | |
946 --bar_width '0.75' \ | |
947 --chart_type 'pie' \ | |
948 --type_of_file 'svg' \ | |
949 --include_html_legend \ | |
950 --resize_nth_label '0' \ | |
951 --label_type 'categorical' | |
952 | |
953 plot_taxa_summary.py \ | |
954 --counts_fname 'test-data/plot_taxa_summary/class.txt' \ | |
955 --dir_path 'test-data/plot_taxa_summary/class_colorby' \ | |
956 --labels 'Class' \ | |
957 --num_categories '20' \ | |
958 --colorby 'PC.636,PC.635' \ | |
959 --background_color 'white' \ | |
960 --dpi '80' \ | |
961 --x_width '12' \ | |
962 --y_height '12' \ | |
963 --bar_width '0.75' \ | |
964 --type_of_file 'pdf' \ | |
965 --chart_type 'area,bar,pie' \ | |
966 --resize_nth_label '0' \ | |
967 --label_type 'categorical' | |
968 | |
969 # split_libraries | |
970 split_libraries.py \ | |
971 --map 'test-data/split_libraries/mapping_file.txt' \ | |
972 -o split_libraries \ | |
973 --fasta 'test-data/split_libraries/reads_1.fna,test-data/split_libraries/reads_2.fna' \ | |
974 --qual 'test-data/split_libraries/reads_1.qual,test-data/split_libraries/reads_2.qual' \ | |
975 --min_qual_score 25 \ | |
976 --qual_score_window 0 \ | |
977 --record_qual_scores \ | |
978 --min_seq_length 200 \ | |
979 --max_seq_length 1000 \ | |
980 --max_ambig 6 \ | |
981 --max_homopolymer 6 \ | |
982 --max_primer_mismatch 0 \ | |
983 --barcode_type 'golay_12' \ | |
984 --max_barcode_errors 1.5 \ | |
985 --start_numbering_at 1 | |
986 cp split_libraries/seqs.fna 'test-data/split_libraries/seqs.fna' | |
987 cp split_libraries/split_library_log.txt 'test-data/split_libraries/split_library_log' | |
988 cp split_libraries/histograms.txt 'test-data/split_libraries/histograms.txt' | |
989 cp split_libraries/seqs_filtered.qual 'test-data/split_libraries/seqs_filtered.qual' | |
990 rm -rf split_libraries | |
991 | |
992 # split_libraries_fastq | |
993 split_libraries_fastq.py \ | |
994 --sequence_read_fps 'test-data/split_libraries_fastq/lane1_read1.fastq.gz' \ | |
995 -o split_libraries_1 \ | |
996 --mapping_fps 'test-data/split_libraries_fastq/map.txt' \ | |
997 --barcode_read_fps 'test-data/split_libraries_fastq/lane1_barcode.fastq.gz' \ | |
998 --max_bad_run_length 3 \ | |
999 --min_per_read_length_fraction 0.75 \ | |
1000 --sequence_max_n 0 \ | |
1001 --start_seq_id 0 \ | |
1002 --rev_comp_mapping_barcodes \ | |
1003 --phred_quality_threshold 19 \ | |
1004 --barcode_type 'golay_12' \ | |
1005 --max_barcode_errors 1.5 | |
1006 rm -rf split_libraries_1 | |
1007 | |
1008 split_libraries_fastq.py \ | |
1009 --sequence_read_fps 'test-data/split_libraries_fastq/lane1_read1.fastq.gz' \ | |
1010 -o split_libraries_2 \ | |
1011 --mapping_fps 'test-data/split_libraries_fastq/map.txt' \ | |
1012 --barcode_read_fps 'test-data/split_libraries_fastq/lane1_barcode.fastq.gz' \ | |
1013 --store_qual_scores \ | |
1014 --store_demultiplexed_fastq \ | |
1015 --max_bad_run_length 3 \ | |
1016 --min_per_read_length_fraction 0.75 \ | |
1017 --sequence_max_n 0 \ | |
1018 --start_seq_id 0 \ | |
1019 --rev_comp_mapping_barcodes \ | |
1020 --phred_quality_threshold 19 \ | |
1021 --barcode_type 'golay_12' \ | |
1022 --max_barcode_errors 1.5 | |
1023 rm -rf split_libraries_2 | |
1024 | |
1025 split_libraries_fastq.py \ | |
1026 --sequence_read_fps 'test-data/split_libraries_fastq/lane1_read1.fastq.gz,test-data/split_libraries_fastq/lane2_read1.fastq.gz' \ | |
1027 -o split_libraries_3 \ | |
1028 --mapping_fps 'test-data/split_libraries_fastq/map.txt,test-data/split_libraries_fastq/map.txt' \ | |
1029 --barcode_read_fps 'test-data/split_libraries_fastq/lane1_barcode.fastq.gz,test-data/split_libraries_fastq/lane2_barcode.fastq.gz' \ | |
1030 --max_bad_run_length 3 \ | |
1031 --min_per_read_length_fraction 0.75 \ | |
1032 --sequence_max_n 0 \ | |
1033 --start_seq_id 0 \ | |
1034 --rev_comp_mapping_barcodes \ | |
1035 --phred_quality_threshold 19 \ | |
1036 --barcode_type 'golay_12' \ | |
1037 --max_barcode_errors 1.5 | |
1038 rm -rf split_libraries_3 | |
1039 | |
1040 split_libraries_fastq.py \ | |
1041 --sequence_read_fps 'test-data/split_libraries_fastq/lane1_read1.fastq.gz' \ | |
1042 -o split_libraries_4 \ | |
1043 --sample_ids 'my.sample.1' \ | |
1044 --max_bad_run_length 3 \ | |
1045 --min_per_read_length_fraction 0.75 \ | |
1046 --sequence_max_n 0 \ | |
1047 --start_seq_id 0 \ | |
1048 --rev_comp_mapping_barcodes \ | |
1049 --phred_quality_threshold 19 \ | |
1050 --barcode_type 'not-barcoded' \ | |
1051 --max_barcode_errors 1.5 | |
1052 rm -rf split_libraries_4 | |
1053 | |
1054 split_libraries_fastq.py \ | |
1055 --sequence_read_fps 'test-data/split_libraries_fastq/lane1_read1.fastq.gz,test-data/split_libraries_fastq/lane2_read1.fastq.gz' \ | |
1056 -o split_libraries_5 \ | |
1057 --sample_ids 'my.sample.1,my.sample.2' \ | |
1058 --max_bad_run_length 3 \ | |
1059 --min_per_read_length_fraction 0.75 \ | |
1060 --sequence_max_n 0 \ | |
1061 --start_seq_id 0 \ | |
1062 --rev_comp_mapping_barcodes \ | |
1063 --phred_quality_threshold 19 \ | |
1064 --barcode_type 'not-barcoded' \ | |
1065 --max_barcode_errors 1.5 | |
1066 rm -rf split_libraries_5 | |
1067 | |
1068 # summarize_taxa | |
1069 cp 'test-data/core_diversity_analyses/otu_table.biom' 'test-data/summarize_taxa/otu_table.biom' | |
1070 cp 'test-data/core_diversity_analyses/map.txt' 'test-data/summarize_taxa/map.txt' | |
1071 | |
1072 summarize_taxa.py \ | |
1073 -i 'test-data/summarize_taxa/otu_table.biom' \ | |
1074 -o summarize_taxa_1 \ | |
1075 -L '2,3,4,5,6' \ | |
1076 -m 'test-data/summarize_taxa/map.txt' \ | |
1077 --md_identifier "taxonomy" \ | |
1078 --delimiter ";" | |
1079 cp summarize_taxa_1/*_L2.txt "test-data/summarize_taxa/1_L2.txt" | |
1080 cp summarize_taxa_1/*_L3.txt "test-data/summarize_taxa/1_L3.txt" | |
1081 cp summarize_taxa_1/*_L4.txt "test-data/summarize_taxa/1_L4.txt" | |
1082 cp summarize_taxa_1/*_L5.txt "test-data/summarize_taxa/1_L5.txt" | |
1083 cp summarize_taxa_1/*_L6.txt "test-data/summarize_taxa/1_L6.txt" | |
1084 rm -rf summarize_taxa_1 | |
1085 | |
1086 summarize_taxa.py \ | |
1087 -i 'test-data/summarize_taxa/otu_table.biom' \ | |
1088 -o summarize_taxa_2 \ | |
1089 -L '3,6' \ | |
1090 --md_identifier "taxonomy" \ | |
1091 --delimiter ";" | |
1092 cp summarize_taxa_2/*_L3.txt "test-data/summarize_taxa/2_L3.txt" | |
1093 cp summarize_taxa_2/*_L6.txt "test-data/summarize_taxa/2_L6.txt" | |
1094 rm -rf summarize_taxa_2 | |
1095 | |
1096 # summarize_taxa_through_plots | |
1097 summarize_taxa_through_plots.py \ | |
1098 --otu_table_fp 'test-data/summarize_taxa_through_plots/otu_table.biom' \ | |
1099 --output_dir summarize_taxa_through_plots_mapping \ | |
1100 --mapping_fp 'test-data/summarize_taxa_through_plots/Fasting_Map.txt' | |
1101 biom convert \ | |
1102 -i 'summarize_taxa_through_plots_mapping/otu_table_L2.biom' \ | |
1103 -o 'summarize_taxa_through_plots_mapping/otu_table_L2_json.biom' \ | |
1104 --to-json | |
1105 biom convert \ | |
1106 -i 'summarize_taxa_through_plots_mapping/otu_table_L3.biom' \ | |
1107 -o 'summarize_taxa_through_plots_mapping/otu_table_L3_json.biom' \ | |
1108 --to-json | |
1109 biom convert \ | |
1110 -i 'summarize_taxa_through_plots_mapping/otu_table_L4.biom' \ | |
1111 -o 'summarize_taxa_through_plots_mapping/otu_table_L4_json.biom' \ | |
1112 --to-json | |
1113 biom convert \ | |
1114 -i 'summarize_taxa_through_plots_mapping/otu_table_L5.biom' \ | |
1115 -o 'summarize_taxa_through_plots_mapping/otu_table_L5_json.biom' \ | |
1116 --to-json | |
1117 biom convert \ | |
1118 -i 'summarize_taxa_through_plots_mapping/otu_table_L6.biom' \ | |
1119 -o 'summarize_taxa_through_plots_mapping/otu_table_L6_json.biom' \ | |
1120 --to-json | |
1121 cp summarize_taxa_through_plots_mapping/*.txt test-data/summarize_taxa_through_plots/mapping/ | |
1122 cp summarize_taxa_through_plots_mapping/*_json.biom test-data/summarize_taxa_through_plots/mapping/ | |
1123 cp summarize_taxa_through_plots_mapping/taxa_summary_plots/area_charts.html 'test-data/summarize_taxa_through_plots/mapping/area_charts.html' | |
1124 cp summarize_taxa_through_plots_mapping/taxa_summary_plots/bar_charts.html 'test-data/summarize_taxa_through_plots/mapping/bar_charts.html' | |
1125 | |
1126 summarize_taxa_through_plots.py \ | |
1127 --otu_table_fp 'test-data/summarize_taxa_through_plots/otu_table.biom' \ | |
1128 --output_dir summarize_taxa_through_plots_mapping_categories \ | |
1129 --mapping_fp 'test-data/summarize_taxa_through_plots/Fasting_Map.txt' \ | |
1130 --mapping_category 'Treatment' | |
1131 biom convert \ | |
1132 -i 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L2.biom' \ | |
1133 -o 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L2_json.biom' \ | |
1134 --to-json | |
1135 biom convert \ | |
1136 -i 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L3.biom' \ | |
1137 -o 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L3_json.biom' \ | |
1138 --to-json | |
1139 biom convert \ | |
1140 -i 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L4.biom' \ | |
1141 -o 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L4_json.biom' \ | |
1142 --to-json | |
1143 biom convert \ | |
1144 -i 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L5.biom' \ | |
1145 -o 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L5_json.biom' \ | |
1146 --to-json | |
1147 biom convert \ | |
1148 -i 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L6.biom' \ | |
1149 -o 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L6_json.biom' \ | |
1150 --to-json | |
1151 cp summarize_taxa_through_plots_mapping_categories/*.txt test-data/summarize_taxa_through_plots/mapping_categories/ | |
1152 cp summarize_taxa_through_plots_mapping_categories/*_json.biom test-data/summarize_taxa_through_plots/mapping_categories/ | |
1153 cp summarize_taxa_through_plots_mapping_categories/taxa_summary_plots/area_charts.html 'test-data/summarize_taxa_through_plots/mapping_categories/area_charts.html' | |
1154 cp summarize_taxa_through_plots_mapping_categories/taxa_summary_plots/bar_charts.html 'test-data/summarize_taxa_through_plots/mapping_categories/bar_charts.html' | |
1155 | |
1156 summarize_taxa_through_plots.py \ | |
1157 --otu_table_fp 'test-data/summarize_taxa_through_plots/otu_table.biom' \ | |
1158 --output_dir summarize_taxa_through_plots_mapping_sort \ | |
1159 --mapping_fp 'test-data/summarize_taxa_through_plots/Fasting_Map.txt' \ | |
1160 --sort | |
1161 biom convert \ | |
1162 -i 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L2.biom' \ | |
1163 -o 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L2_json.biom' \ | |
1164 --to-json | |
1165 biom convert \ | |
1166 -i 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L3.biom' \ | |
1167 -o 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L3_json.biom' \ | |
1168 --to-json | |
1169 biom convert \ | |
1170 -i 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L4.biom' \ | |
1171 -o 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L4_json.biom' \ | |
1172 --to-json | |
1173 biom convert \ | |
1174 -i 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L5.biom' \ | |
1175 -o 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L5_json.biom' \ | |
1176 --to-json | |
1177 biom convert \ | |
1178 -i 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L6.biom' \ | |
1179 -o 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L6_json.biom' \ | |
1180 --to-json | |
1181 cp summarize_taxa_through_plots_mapping_sort/*.txt test-data/summarize_taxa_through_plots/mapping_sort/ | |
1182 cp summarize_taxa_through_plots_mapping_sort/*_json.biom test-data/summarize_taxa_through_plots/mapping_sort/ | |
1183 cp summarize_taxa_through_plots_mapping_sort/taxa_summary_plots/area_charts.html 'test-data/summarize_taxa_through_plots/mapping_sort/area_charts.html' | |
1184 cp summarize_taxa_through_plots_mapping_sort/taxa_summary_plots/bar_charts.html 'test-data/summarize_taxa_through_plots/mapping_sort/bar_charts.html' | |
1185 | |
1186 summarize_taxa_through_plots.py \ | |
1187 --otu_table_fp 'test-data/summarize_taxa_through_plots/otu_table.biom' \ | |
1188 --output_dir summarize_taxa_through_plots_without_mapping | |
1189 biom convert \ | |
1190 -i 'summarize_taxa_through_plots_without_mapping/otu_table_L2.biom' \ | |
1191 -o 'summarize_taxa_through_plots_without_mapping/otu_table_L2_json.biom' \ | |
1192 --to-json | |
1193 biom convert \ | |
1194 -i 'summarize_taxa_through_plots_without_mapping/otu_table_L3.biom' \ | |
1195 -o 'summarize_taxa_through_plots_without_mapping/otu_table_L3_json.biom' \ | |
1196 --to-json | |
1197 biom convert \ | |
1198 -i 'summarize_taxa_through_plots_without_mapping/otu_table_L4.biom' \ | |
1199 -o 'summarize_taxa_through_plots_without_mapping/otu_table_L4_json.biom' \ | |
1200 --to-json | |
1201 biom convert \ | |
1202 -i 'summarize_taxa_through_plots_without_mapping/otu_table_L5.biom' \ | |
1203 -o 'summarize_taxa_through_plots_without_mapping/otu_table_L5_json.biom' \ | |
1204 --to-json | |
1205 biom convert \ | |
1206 -i 'summarize_taxa_through_plots_without_mapping/otu_table_L6.biom' \ | |
1207 -o 'summarize_taxa_through_plots_without_mapping/otu_table_L6_json.biom' \ | |
1208 --to-json | |
1209 cp summarize_taxa_through_plots_without_mapping/*.txt test-data/summarize_taxa_through_plots/without_mapping/ | |
1210 cp summarize_taxa_through_plots_without_mapping/*_json.biom test-data/summarize_taxa_through_plots/without_mapping/ | |
1211 cp summarize_taxa_through_plots_without_mapping/taxa_summary_plots/area_charts.html 'test-data/summarize_taxa_through_plots/without_mapping/area_charts.html' | |
1212 cp summarize_taxa_through_plots_without_mapping/taxa_summary_plots/bar_charts.html 'test-data/summarize_taxa_through_plots/without_mapping/bar_charts.html' | |
1213 | |
1214 # upgma_cluster | |
1215 upgma_cluster.py \ | |
1216 --input_path 'test-data/upgma_cluster/' \ | |
1217 --output_path 'test-data/upgma_cluster/' | |
1218 | |
1219 # validate_mapping_file | |
1220 validate_mapping_file.py \ | |
1221 -m 'test-data/validate_mapping_file/map.tsv' \ | |
1222 -o validate_mapping_file_output \ | |
1223 -c '_' | |
1224 cp validate_mapping_file_output/*.html 'test-data/validate_mapping_file/map.tsv.html' | |
1225 cp validate_mapping_file_output/*.log 'test-data/validate_mapping_file/map.tsv.log' | |
1226 cp validate_mapping_file_output/*corrected.txt 'test-data/validate_mapping_file/map.tsv_corrected.txt' | |
1227 rm -rf validate_mapping_file_output |