Mercurial > repos > iuc > qiime_split_libraries_fastq
comparison generate_test_data.sh @ 0:20194da2549d draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/qiime/ commit a9d1e0debcd357d8080a1c6c5f1d206dd45a7a4d
| author | iuc | 
|---|---|
| date | Fri, 19 May 2017 03:54:05 -0400 | 
| parents | |
| children | 6e8fa1df22eb | 
   comparison
  equal
  deleted
  inserted
  replaced
| -1:000000000000 | 0:20194da2549d | 
|---|---|
| 1 #!/usr/bin/env bash | |
| 2 | |
| 3 # Data are from test data in https://github.com/biocore/qiime | |
| 4 | |
| 5 # align_seqs | |
| 6 align_seqs.py \ | |
| 7 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
| 8 -o 'align_seqs_pynast_uclust' \ | |
| 9 --alignment_method 'pynast' \ | |
| 10 --pairwise_alignment_method 'uclust' \ | |
| 11 --template_fp 'test-data/align_seqs/core_set_aligned.fasta.imputed' \ | |
| 12 --min_percent_id '0.75' | |
| 13 | |
| 14 align_seqs.py \ | |
| 15 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
| 16 -o 'align_seqs_pynast_muscle' \ | |
| 17 --alignment_method 'pynast' \ | |
| 18 --pairwise_alignment_method 'muscle' \ | |
| 19 --min_length '50' \ | |
| 20 --min_percent_id '0.75' | |
| 21 | |
| 22 align_seqs.py \ | |
| 23 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
| 24 -o 'align_seqs_pynast_pair_hmm' \ | |
| 25 --alignment_method 'pynast' \ | |
| 26 --pairwise_alignment_method 'pair_hmm' \ | |
| 27 --min_percent_id '0.75' | |
| 28 | |
| 29 #align_seqs.py \ | |
| 30 # --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
| 31 # -o 'align_seqs_pynast_clustal' \ | |
| 32 # --alignment_method 'pynast' \ | |
| 33 # --pairwise_alignment_method 'clustal' \ | |
| 34 # --min_percent_id '0.75' | |
| 35 | |
| 36 align_seqs.py \ | |
| 37 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
| 38 -o 'align_seqs_pynast_blast' \ | |
| 39 --alignment_method 'pynast' \ | |
| 40 --pairwise_alignment_method 'blast' \ | |
| 41 --min_percent_id '0.75' | |
| 42 | |
| 43 align_seqs.py \ | |
| 44 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
| 45 -o 'align_seqs_pynast_mafft' \ | |
| 46 --alignment_method 'pynast' \ | |
| 47 --pairwise_alignment_method 'mafft' \ | |
| 48 --min_percent_id '0.75' | |
| 49 | |
| 50 #align_seqs.py \ | |
| 51 # --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
| 52 # -o 'align_seqs_infernal' \ | |
| 53 # --alignment_method 'infernal' \ | |
| 54 # --template_fp 'test-data/align_seqs/seed.16s.reference_model.sto' \ | |
| 55 # --min_percent_id '0.75' | |
| 56 | |
| 57 #align_seqs.py \ | |
| 58 # --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
| 59 # -o 'align_seqs_clustalw' \ | |
| 60 # --alignment_method 'clustalw' \ | |
| 61 # --min_percent_id '0.75' | |
| 62 | |
| 63 align_seqs.py \ | |
| 64 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
| 65 -o 'align_seqs_muscle' \ | |
| 66 --alignment_method 'muscle' \ | |
| 67 --min_percent_id '0.75' | |
| 68 | |
| 69 align_seqs.py \ | |
| 70 --input_fasta_fp 'test-data/align_seqs/unaligned.fna' \ | |
| 71 -o 'align_seqs_mafft' \ | |
| 72 --alignment_method 'mafft' \ | |
| 73 --min_percent_id '0.75' | |
| 74 | |
| 75 #alpha_rarefaction | |
| 76 alpha_rarefaction.py \ | |
| 77 --otu_table_fp "test-data/alpha_rarefaction/otu_table.biom" \ | |
| 78 --mapping_fp "test-data/alpha_rarefaction/mapping_file.txt" \ | |
| 79 -o alpha_rarefaction \ | |
| 80 --num_steps '2' \ | |
| 81 --tree_fp "test-data/alpha_rarefaction/rep_set.tre" \ | |
| 82 --min_rare_depth '10' \ | |
| 83 --max_rare_depth '50' \ | |
| 84 --retain_intermediate_files | |
| 85 rm -rf alpha_rarefaction | |
| 86 | |
| 87 # assign_taxonomy | |
| 88 assign_taxonomy.py \ | |
| 89 --input_fasta_fp 'test-data/assign_taxonomy/uclust_input_seqs.fasta' \ | |
| 90 --assignment_method 'uclust' \ | |
| 91 --min_consensus_fraction '0.51' \ | |
| 92 --similarity '0.9' \ | |
| 93 --uclust_max_accepts '3' \ | |
| 94 -o assign_taxonomy_uclust | |
| 95 cp assign_taxonomy_uclust/uclust_input_seqs_tax_assignments.txt 'test-data/assign_taxonomy/uclust_taxonomic_assignation.txt' | |
| 96 rm -rf assign_taxonomy_uclust | |
| 97 | |
| 98 #assign_taxonomy.py \ | |
| 99 # --input_fasta_fp 'test-data/assign_taxonomy/rdp_input_seqs.fasta' \ | |
| 100 # --id_to_taxonomy_fp 'test-data/assign_taxonomy/rdp_id_to_taxonomy.txt' \ | |
| 101 # --assignment_method 'rdp' \ | |
| 102 # --confidence '3' \ | |
| 103 # -o assign_taxonomy_rdp | |
| 104 | |
| 105 #assign_taxonomy.py \ | |
| 106 # --input_fasta_fp 'test-data/assign_taxonomy/rtax_ref_seq_set.fna' \ | |
| 107 # --id_to_taxonomy_fp 'test-data/assign_taxonomy/rtax_id_to_taxonomy.txt' \ | |
| 108 # --assignment_method 'rtax' \ | |
| 109 # --read_1_seqs_fp 'test-data/assign_taxonomy/read_1.seqs.fna' \ | |
| 110 # --read_2_seqs_fp 'test-data/assign_taxonomy/read_2.seqs.fna' \ | |
| 111 # --single_ok \ | |
| 112 # --no_single_ok_generic \ | |
| 113 # --read_id_regex "\S+\s+(\S+)" \ | |
| 114 # --amplicon_id_regex "(\S+)\s+(\S+?)\/" \ | |
| 115 # --header_id_regex "\S+\s+(\S+?)\/" \ | |
| 116 # -o assign_taxonomy_rtax | |
| 117 #ls assign_taxonomy_rtax | |
| 118 | |
| 119 #assign_taxonomy.py \ | |
| 120 # --input_fasta_fp 'test-data/assign_taxonomy/mothur_ref_seq_set.fna' \ | |
| 121 # --id_to_taxonomy_fp 'test-data/assign_taxonomy/mothur_id_to_taxonomy.txt' \ | |
| 122 # --assignment_method 'mothur' \ | |
| 123 # --confidence 0.5 \ | |
| 124 # -o assign_taxonomy_mothur | |
| 125 #ls assign_taxonomy_mothur | |
| 126 | |
| 127 assign_taxonomy.py \ | |
| 128 --input_fasta_fp 'test-data/assign_taxonomy/mothur_ref_seq_set.fna' \ | |
| 129 --assignment_method 'sortmerna' \ | |
| 130 --min_consensus_fraction "0.51" \ | |
| 131 --similarity "0.9" \ | |
| 132 --sortmerna_e_value "1.0" \ | |
| 133 --sortmerna_coverage "0.9" \ | |
| 134 --sortmerna_best_N_alignments "5" \ | |
| 135 -o assign_taxonomy_sortmerna | |
| 136 cp assign_taxonomy_sortmerna/sortmerna_map.blast 'test-data/assign_taxonomy/sortmerna_map.blast' | |
| 137 cp assign_taxonomy_sortmerna/mothur_ref_seq_set_tax_assignments.txt 'test-data/assign_taxonomy/sortmerna_taxonomic_assignation.txt' | |
| 138 rm -rf assign_taxonomy_sortmerna | |
| 139 | |
| 140 #beta_diversity | |
| 141 beta_diversity.py \ | |
| 142 --input_path 'test-data/beta_diversity/otu_table.biom' \ | |
| 143 -o beta_diversity_1 \ | |
| 144 --metrics 'unweighted_unifrac,weighted_unifrac' \ | |
| 145 --tree_path 'test-data/beta_diversity/rep_set.tre' | |
| 146 md5 'beta_diversity_1/unweighted_unifrac_otu_table.txt' | |
| 147 md5 'beta_diversity_1/weighted_unifrac_otu_table.txt' | |
| 148 rm -rf beta_diversity_1 | |
| 149 | |
| 150 beta_diversity.py \ | |
| 151 --input_path 'test-data/beta_diversity/otu_table.biom' \ | |
| 152 -o beta_diversity_2 \ | |
| 153 --metrics 'abund_jaccard,binary_chisq,binary_chord,binary_euclidean,binary_hamming,binary_jaccard,binary_lennon,binary_ochiai,binary_pearson,binary_sorensen_dice,bray_curtis,canberra,chisq,chord,euclidean,gower,hellinger,kulczynski,manhattan,morisita_horn,pearson,soergel,spearman_approx,specprof,unifrac_g,unifrac_g_full_tree,unweighted_unifrac,unweighted_unifrac_full_tree,weighted_normalized_unifrac,weighted_unifrac' \ | |
| 154 --tree_path 'test-data/beta_diversity/rep_set.tre' | |
| 155 md5 'beta_diversity_2/canberra_otu_table.txt' | |
| 156 md5 'beta_diversity_2/pearson_otu_table.txt' | |
| 157 rm -rf beta_diversity_2 | |
| 158 | |
| 159 #beta_diversity_through_plots | |
| 160 beta_diversity_through_plots.py \ | |
| 161 --otu_table_fp 'test-data/beta_diversity_through_plots/otu_table.biom' \ | |
| 162 --mapping_fp 'test-data/beta_diversity_through_plots/map.txt' \ | |
| 163 --output_dir beta_diversity_through_plots \ | |
| 164 --tree_fp 'test-data/beta_diversity_through_plots/rep_set.tre' \ | |
| 165 --parallel | |
| 166 cp beta_diversity_through_plots/unweighted_unifrac_dm.txt 'test-data/beta_diversity_through_plots/' | |
| 167 cp beta_diversity_through_plots/unweighted_unifrac_pc.txt 'test-data/beta_diversity_through_plots/' | |
| 168 cp beta_diversity_through_plots/weighted_unifrac_dm.txt 'test-data/beta_diversity_through_plots/' | |
| 169 cp beta_diversity_through_plots/weighted_unifrac_pc.txt 'test-data/beta_diversity_through_plots/' | |
| 170 rm -rf beta_diversity_through_plots | |
| 171 | |
| 172 # compare_categories | |
| 173 compare_categories.py \ | |
| 174 --method 'adonis' \ | |
| 175 --input_dm 'test-data/compare_categories/unweighted_unifrac_dm.txt' \ | |
| 176 --mapping_file 'test-data/compare_categories/map.txt' \ | |
| 177 --categories 'Treatment' \ | |
| 178 -o compare_categories_1 \ | |
| 179 --num_permutations '999' | |
| 180 cp compare_categories_1/adonis_results.txt "test-data/compare_categories/adonis_results.txt" | |
| 181 rm -rf compare_categories_1 | |
| 182 | |
| 183 compare_categories.py \ | |
| 184 --method 'dbrda' \ | |
| 185 --input_dm 'test-data/compare_categories/unweighted_unifrac_dm.txt' \ | |
| 186 --mapping_file 'test-data/compare_categories/map.txt' \ | |
| 187 --categories 'Treatment' \ | |
| 188 -o compare_categories_2 \ | |
| 189 --num_permutations '99' | |
| 190 cp compare_categories_2/* "test-data/compare_categories/" | |
| 191 rm -rf compare_categories_2 | |
| 192 | |
| 193 # core_diversity_analyses | |
| 194 core_diversity_analyses.py \ | |
| 195 --input_biom_fp 'test-data/core_diversity_analyses/otu_table.biom' \ | |
| 196 -o core_diversity_analyses_1 \ | |
| 197 --mapping_fp 'test-data/core_diversity_analyses/map.txt' \ | |
| 198 --sampling_depth 22 \ | |
| 199 --tree_fp 'test-data/core_diversity_analyses/rep_set.tre' | |
| 200 cp core_diversity_analyses_1/bdiv_even22/unweighted_unifrac_pc.txt 'test-data/core_diversity_analyses/unweighted_unifrac_pc.txt' | |
| 201 rm -rf core_diversity_analyses_1 | |
| 202 | |
| 203 core_diversity_analyses.py \ | |
| 204 --input_biom_fp 'test-data/core_diversity_analyses/otu_table.biom' \ | |
| 205 -o core_diversity_analyses_2 \ | |
| 206 --mapping_fp 'test-data/core_diversity_analyses/map.txt' \ | |
| 207 --sampling_depth 22 \ | |
| 208 --nonphylogenetic_diversity \ | |
| 209 --suppress_taxa_summary \ | |
| 210 --suppress_beta_diversity \ | |
| 211 --suppress_alpha_diversity \ | |
| 212 --suppress_group_significance | |
| 213 rm -rf core_diversity_analyses_2 | |
| 214 | |
| 215 # filter_alignment | |
| 216 filter_alignment.py \ | |
| 217 --input_fasta_file 'test-data/filter_alignment/alignment.fasta' \ | |
| 218 -o 'filter_alignment_default' \ | |
| 219 --allowed_gap_frac '0.999999' \ | |
| 220 --threshold '3.0' | |
| 221 | |
| 222 filter_alignment.py \ | |
| 223 --input_fasta_file 'test-data/filter_alignment/alignment.fasta' \ | |
| 224 -o 'filter_alignment_without_mask_filter_and_outliers' \ | |
| 225 --suppress_lane_mask_filter \ | |
| 226 --allowed_gap_frac '0.999999' \ | |
| 227 --remove_outliers \ | |
| 228 --threshold '3.0' | |
| 229 | |
| 230 filter_alignment.py \ | |
| 231 --input_fasta_file 'test-data/filter_alignment/alignment.fasta' \ | |
| 232 -o 'filter_alignment_entropy' \ | |
| 233 --allowed_gap_frac '0.999999' \ | |
| 234 --threshold '3.0' \ | |
| 235 --entropy_threshold '0.1' | |
| 236 | |
| 237 # filter_fasta | |
| 238 filter_fasta.py \ | |
| 239 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
| 240 --output_fasta_fp 'filter_fasta_otu_map.fasta' \ | |
| 241 --otu_map 'test-data/filter_fasta/otu_map.txt' | |
| 242 | |
| 243 filter_fasta.py \ | |
| 244 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
| 245 --output_fasta_fp 'filter_fasta_otu_map_negate.fasta' \ | |
| 246 --otu_map 'test-data/filter_fasta/otu_map.txt' \ | |
| 247 --negate | |
| 248 | |
| 249 filter_fasta.py \ | |
| 250 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
| 251 --output_fasta_fp 'filter_fasta_seq_id.fasta' \ | |
| 252 --seq_id_fp 'test-data/filter_fasta/seqs_to_keep.txt' | |
| 253 | |
| 254 filter_fasta.py \ | |
| 255 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
| 256 --output_fasta_fp 'filter_fasta_otu_table.fasta' \ | |
| 257 --biom_fp 'test-data/filter_fasta/otu_table.biom' | |
| 258 | |
| 259 filter_fasta.py \ | |
| 260 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
| 261 --output_fasta_fp 'filter_fasta_subject_fasta.fasta' \ | |
| 262 --subject_fasta_fp 'test-data/filter_fasta/sl_inseqs.fasta' | |
| 263 | |
| 264 filter_fasta.py \ | |
| 265 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
| 266 --output_fasta_fp 'filter_fasta_seq_id_prefix.fasta' \ | |
| 267 --seq_id_prefix 'S5' | |
| 268 | |
| 269 filter_fasta.py \ | |
| 270 --input_fasta_fp 'test-data/filter_fasta/inseqs.fasta' \ | |
| 271 --output_fasta_fp 'filter_fasta_sample_id.fasta' \ | |
| 272 --sample_id_fp 'test-data/filter_fasta/map.txt' | |
| 273 | |
| 274 # filter_otus_from_otu_table | |
| 275 filter_otus_from_otu_table.py \ | |
| 276 --input_fp 'test-data/filter_otus_from_otu_table/otu_table.biom' \ | |
| 277 --min_count '2' \ | |
| 278 --max_count '1000' \ | |
| 279 --min_samples '5' \ | |
| 280 --max_samples '350' \ | |
| 281 --output_fp 'test-data/filter_otus_from_otu_table/filtered_otu_table.biom' | |
| 282 | |
| 283 filter_otus_from_otu_table.py \ | |
| 284 --input_fp 'test-data/filter_otus_from_otu_table/otu_table.biom' \ | |
| 285 --otu_ids_to_exclude_fp 'test-data/filter_otus_from_otu_table/chimeric_otus.txt' \ | |
| 286 --output_fp 'test-data/filter_otus_from_otu_table/chimera_filtered_otu_table.biom' | |
| 287 | |
| 288 filter_otus_from_otu_table.py \ | |
| 289 --input_fp 'test-data/filter_otus_from_otu_table/otu_table.biom' \ | |
| 290 --otu_ids_to_exclude_fp 'test-data/filter_otus_from_otu_table/chimeric_otus.txt' \ | |
| 291 --negate_ids_to_exclude \ | |
| 292 --output_fp 'test-data/filter_otus_from_otu_table/chimera_picked_otu_table.biom' | |
| 293 | |
| 294 # filter_samples_from_otu_table | |
| 295 filter_samples_from_otu_table.py \ | |
| 296 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
| 297 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 298 --min_count '150' | |
| 299 biom convert \ | |
| 300 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 301 -o 'test-data/filter_samples_from_otu_table/abundance_min.biom' \ | |
| 302 --to-json | |
| 303 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
| 304 | |
| 305 filter_samples_from_otu_table.py \ | |
| 306 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
| 307 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 308 --min_count '0' \ | |
| 309 --max_count '149' | |
| 310 biom convert \ | |
| 311 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 312 -o 'test-data/filter_samples_from_otu_table/abundance_max.biom' \ | |
| 313 --to-json | |
| 314 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
| 315 | |
| 316 filter_samples_from_otu_table.py \ | |
| 317 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
| 318 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 319 --mapping_fp 'test-data/filter_samples_from_otu_table/map.txt' \ | |
| 320 --output_mapping_fp 'test-data/filter_samples_from_otu_table/metadata_positive.txt' \ | |
| 321 -s 'Treatment:Control' | |
| 322 biom convert \ | |
| 323 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 324 -o 'test-data/filter_samples_from_otu_table/metadata_positive.biom' \ | |
| 325 --to-json | |
| 326 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
| 327 | |
| 328 filter_samples_from_otu_table.py \ | |
| 329 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
| 330 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 331 --mapping_fp 'test-data/filter_samples_from_otu_table/map.txt' \ | |
| 332 -s 'Treatment:*,!Control' | |
| 333 biom convert \ | |
| 334 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 335 -o 'test-data/filter_samples_from_otu_table/metadata_negative.biom' \ | |
| 336 --to-json | |
| 337 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
| 338 | |
| 339 filter_samples_from_otu_table.py \ | |
| 340 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
| 341 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 342 --sample_id_fp 'test-data/filter_samples_from_otu_table/ids.txt' | |
| 343 biom convert \ | |
| 344 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 345 -o 'test-data/filter_samples_from_otu_table/id_positive.biom' \ | |
| 346 --to-json | |
| 347 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
| 348 | |
| 349 filter_samples_from_otu_table.py \ | |
| 350 --input_fp 'test-data/filter_samples_from_otu_table/otu_table.biom' \ | |
| 351 --output_fp 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 352 --sample_id_fp 'test-data/filter_samples_from_otu_table/ids.txt' \ | |
| 353 --negate_sample_id_fp | |
| 354 biom convert \ | |
| 355 -i 'test-data/filter_samples_from_otu_table/tmp.biom' \ | |
| 356 -o 'test-data/filter_samples_from_otu_table/id_negative.biom' \ | |
| 357 --to-json | |
| 358 rm 'test-data/filter_samples_from_otu_table/tmp.biom' | |
| 359 | |
| 360 # filter_taxa_from_otu_table | |
| 361 filter_taxa_from_otu_table.py \ | |
| 362 --input_otu_table_fp 'test-data/filter_taxa_from_otu_table/otu_table.biom' \ | |
| 363 --output_otu_table_fp 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
| 364 --positive_taxa 'p__Bacteroidetes,p__Firmicutes' \ | |
| 365 --metadata_field 'taxonomy' | |
| 366 biom convert \ | |
| 367 -i 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
| 368 -o 'test-data/filter_taxa_from_otu_table/positive_taxa.biom' \ | |
| 369 --to-json | |
| 370 rm 'test-data/filter_taxa_from_otu_table/tmp.biom' | |
| 371 | |
| 372 filter_taxa_from_otu_table.py \ | |
| 373 --input_otu_table_fp 'test-data/filter_taxa_from_otu_table/otu_table.biom' \ | |
| 374 --output_otu_table_fp 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
| 375 --negative_taxa 'p__Bacteroidetes,p__Firmicutes' \ | |
| 376 --metadata_field 'taxonomy' | |
| 377 biom convert \ | |
| 378 -i 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
| 379 -o 'test-data/filter_taxa_from_otu_table/negative_taxa.biom' \ | |
| 380 --to-json | |
| 381 rm 'test-data/filter_taxa_from_otu_table/tmp.biom' | |
| 382 | |
| 383 filter_taxa_from_otu_table.py \ | |
| 384 --input_otu_table_fp 'test-data/filter_taxa_from_otu_table/otu_table.biom' \ | |
| 385 --output_otu_table_fp 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
| 386 --positive_taxa 'p__Firmicutes' \ | |
| 387 --negative_taxa 'c__Clostridia' \ | |
| 388 --metadata_field 'taxonomy' | |
| 389 biom convert \ | |
| 390 -i 'test-data/filter_taxa_from_otu_table/tmp.biom' \ | |
| 391 -o 'test-data/filter_taxa_from_otu_table/positive_negative_taxa.biom' \ | |
| 392 --to-json | |
| 393 rm 'test-data/filter_taxa_from_otu_table/tmp.biom' | |
| 394 | |
| 395 # jackknifed_beta_diversity | |
| 396 jackknifed_beta_diversity.py \ | |
| 397 --otu_table_fp 'test-data/jackknifed_beta_diversity/otu_table.biom' \ | |
| 398 --mapping_fp 'test-data/jackknifed_beta_diversity/map.txt' \ | |
| 399 -o jackknifed_beta_diversity \ | |
| 400 --seqs_per_sample '10' \ | |
| 401 --tree_fp 'test-data/jackknifed_beta_diversity/rep_set.tre' \ | |
| 402 --master_tree 'consensus' \ | |
| 403 --parallel | |
| 404 rm -rf jackknifed_beta_diversity | |
| 405 | |
| 406 # make_emperor | |
| 407 cp 'test-data/core_diversity_analyses/unweighted_unifrac_pc.txt' 'test-data/make_emperor/unweighted_unifrac_pc.txt' | |
| 408 cp 'test-data/core_diversity_analyses/map.txt' 'test-data/make_emperor/map.txt' | |
| 409 cp 'test-data/summarize_taxa/2_L3.txt' 'test-data/make_emperor/2_L3.txt' | |
| 410 | |
| 411 make_emperor.py \ | |
| 412 --input_coords 'test-data/make_emperor/unweighted_unifrac_pc.txt' \ | |
| 413 -o make_emperor_1 \ | |
| 414 --map_fp 'test-data/make_emperor/map.txt' \ | |
| 415 --number_of_axes '10' \ | |
| 416 --add_unique_columns \ | |
| 417 --number_of_segments 8 | |
| 418 rm -rf make_emperor_1 | |
| 419 | |
| 420 make_emperor.py \ | |
| 421 --input_coords 'test-data/make_emperor/unweighted_unifrac_pc.txt' \ | |
| 422 -o make_emperor_2 \ | |
| 423 --map_fp 'test-data/make_emperor/map.txt' \ | |
| 424 --number_of_axes '10' \ | |
| 425 --add_unique_columns \ | |
| 426 --number_of_segments 8 \ | |
| 427 --taxa_fp 'test-data/make_emperor/2_L3.txt' \ | |
| 428 --n_taxa_to_keep 10 | |
| 429 rm -rf make_emperor_2 | |
| 430 | |
| 431 # make_otu_heatmap | |
| 432 make_otu_heatmap.py \ | |
| 433 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
| 434 --imagetype 'pdf' \ | |
| 435 --color_scheme "YlGn" \ | |
| 436 --width "5" \ | |
| 437 --height "5" \ | |
| 438 --dpi "200" \ | |
| 439 --obs_md_category "taxonomy" \ | |
| 440 --output_fp 'test-data/make_otu_heatmap/basic_heatmap.pdf' | |
| 441 | |
| 442 make_otu_heatmap.py \ | |
| 443 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
| 444 --imagetype 'png' \ | |
| 445 --color_scheme "YlGn" \ | |
| 446 --width "5" \ | |
| 447 --height "5" \ | |
| 448 --dpi "200" \ | |
| 449 --obs_md_category "taxonomy" \ | |
| 450 --output_fp 'test-data/make_otu_heatmap/basic_heatmap.png' | |
| 451 | |
| 452 make_otu_heatmap.py \ | |
| 453 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
| 454 --imagetype 'svg' \ | |
| 455 --color_scheme "YlGn" \ | |
| 456 --width "5" \ | |
| 457 --height "5" \ | |
| 458 --dpi "200" \ | |
| 459 --obs_md_category "taxonomy" \ | |
| 460 --output_fp 'test-data/make_otu_heatmap/basic_heatmap.svg' | |
| 461 | |
| 462 make_otu_heatmap.py \ | |
| 463 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
| 464 --map_fname 'test-data/make_otu_heatmap/mapping_file.txt' \ | |
| 465 --imagetype 'pdf' \ | |
| 466 --color_scheme "YlGn" \ | |
| 467 --width "5" \ | |
| 468 --height "5" \ | |
| 469 --dpi "200" \ | |
| 470 --obs_md_category "taxonomy" \ | |
| 471 --output_fp 'test-data/make_otu_heatmap/sample_sorted_heatmap.pdf' | |
| 472 | |
| 473 make_otu_heatmap.py \ | |
| 474 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
| 475 --map_fname 'test-data/make_otu_heatmap/mapping_file.txt' \ | |
| 476 --otu_tree 'test-data/make_otu_heatmap/rep_set.tre' \ | |
| 477 --imagetype 'pdf' \ | |
| 478 --color_scheme "YlGn" \ | |
| 479 --width "5" \ | |
| 480 --height "5" \ | |
| 481 --dpi "200" \ | |
| 482 --obs_md_category "taxonomy" \ | |
| 483 --output_fp 'test-data/make_otu_heatmap/sample_otu_sorted_heatmap.pdf' | |
| 484 | |
| 485 make_otu_heatmap.py \ | |
| 486 --otu_table_fp 'test-data/make_otu_heatmap/otu_table.biom' \ | |
| 487 --map_fname 'test-data/make_otu_heatmap/mapping_file.txt' \ | |
| 488 --category "Treatment" \ | |
| 489 --imagetype 'pdf' \ | |
| 490 --color_scheme "YlGn" \ | |
| 491 --width "5" \ | |
| 492 --height "5" \ | |
| 493 --dpi "200" \ | |
| 494 --obs_md_category "taxonomy" \ | |
| 495 --output_fp 'test-data/make_otu_heatmap/treatment_sample_sorted_heatmap.pdf' | |
| 496 | |
| 497 # make_phylogeny | |
| 498 make_phylogeny.py \ | |
| 499 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
| 500 --result_fp 'test-data/make_phylogeny/fasttree_tree_method_default.tre' \ | |
| 501 --tree_method 'fasttree' \ | |
| 502 --log_fp 'fasttree_tree_method_default.txt' \ | |
| 503 --root_method 'tree_method_default' | |
| 504 | |
| 505 make_phylogeny.py \ | |
| 506 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
| 507 --result_fp 'raxml_v730.tre' \ | |
| 508 --tree_method 'raxml_v730' \ | |
| 509 --log_fp 'raxml_v730.txt' \ | |
| 510 --root_method 'tree_method_default' | |
| 511 | |
| 512 make_phylogeny.py \ | |
| 513 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
| 514 --result_fp 'test-data/make_phylogeny/muscle.tre' \ | |
| 515 --tree_method 'muscle' \ | |
| 516 --log_fp 'muscle.txt' \ | |
| 517 --root_method 'tree_method_default' | |
| 518 | |
| 519 make_phylogeny.py \ | |
| 520 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
| 521 --result_fp 'test-data/make_phylogeny/clustalw.tre' \ | |
| 522 --tree_method 'clustalw' \ | |
| 523 --log_fp 'clustalw.txt' \ | |
| 524 --root_method 'tree_method_default' | |
| 525 | |
| 526 make_phylogeny.py \ | |
| 527 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
| 528 --result_fp 'clearcut.tre' \ | |
| 529 --tree_method 'clearcut' \ | |
| 530 --log_fp 'clearcut.txt' \ | |
| 531 --root_method 'tree_method_default' | |
| 532 | |
| 533 make_phylogeny.py \ | |
| 534 --input_fp 'test-data/make_phylogeny/aligned.fasta' \ | |
| 535 --result_fp 'test-data/make_phylogeny/fasttree_midpoint.tre' \ | |
| 536 --tree_method 'fasttree' \ | |
| 537 --log_fp 'fasttree_midpoint.txt' \ | |
| 538 --root_method 'midpoint' | |
| 539 | |
| 540 # multiple_join_paired_ends | |
| 541 multiple_join_paired_ends.py \ | |
| 542 --input_dir 'test-data/multiple_join_paired_ends/without_barcode/' \ | |
| 543 --output_dir 'test-data/multiple_join_paired_ends/output_without_barcode' \ | |
| 544 --read1_indicator 'forward_' \ | |
| 545 --read2_indicator 'reverse_' \ | |
| 546 --leading_text '' \ | |
| 547 --trailing_text '' | |
| 548 | |
| 549 #multiple_join_paired_ends.py \ | |
| 550 # --input_dir 'test-data/multiple_join_paired_ends/without_barcode/' \ | |
| 551 # --output_dir 'multiple_join_paired_ends_without_barcode_parameter_files' \ | |
| 552 # --parameter_fp 'test-data/multiple_join_paired_ends/qiime_parameters.txt' \ | |
| 553 # --read1_indicator '_R1_' \ | |
| 554 # --read2_indicator '_R2_' \ | |
| 555 # --leading_text '' \ | |
| 556 # --trailing_text '' | |
| 557 | |
| 558 multiple_join_paired_ends.py \ | |
| 559 --input_dir 'test-data/multiple_join_paired_ends/with_barcode/' \ | |
| 560 --output_dir 'test-data/multiple_join_paired_ends/output_with_barcode' \ | |
| 561 --read1_indicator 'forward_' \ | |
| 562 --read2_indicator 'reverse_' \ | |
| 563 --match_barcodes \ | |
| 564 --barcode_indicator 'barcode_' \ | |
| 565 --leading_text '' \ | |
| 566 --trailing_text '' | |
| 567 | |
| 568 # multiple_split_libraries_fastq | |
| 569 multiple_split_libraries_fastq.py \ | |
| 570 --input_dir 'test-data/multiple_split_libraries_fastq/input' \ | |
| 571 --output_dir 'multiple_split_libraries_fastq' \ | |
| 572 --demultiplexing_method 'mapping_barcode_files' \ | |
| 573 --read_indicator 'reads_' \ | |
| 574 --barcode_indicator 'barcodes_' \ | |
| 575 --mapping_indicator 'mapping_' \ | |
| 576 --mapping_extensions 'txt' \ | |
| 577 --leading_text '' \ | |
| 578 --trailing_text '' \ | |
| 579 --sampleid_indicator '.' | |
| 580 | |
| 581 multiple_split_libraries_fastq.py \ | |
| 582 --input_dir 'test-data/multiple_split_libraries_fastq/input' \ | |
| 583 --output_dir 'multiple_split_libraries_fastq_with_parameter_file' \ | |
| 584 --demultiplexing_method 'mapping_barcode_files' \ | |
| 585 --parameter_fp 'test-data/multiple_split_libraries_fastq/qiime_parameters.txt' \ | |
| 586 --read_indicator 'reads_' \ | |
| 587 --barcode_indicator 'barcodes_' \ | |
| 588 --mapping_indicator 'mapping_' \ | |
| 589 --mapping_extensions 'txt' \ | |
| 590 --leading_text '' \ | |
| 591 --trailing_text '' \ | |
| 592 --sampleid_indicator '.' | |
| 593 | |
| 594 # pick_closed_reference_otus | |
| 595 pick_closed_reference_otus.py \ | |
| 596 --input_fp 'test-data/pick_closed_reference_otus/seqs.fna' \ | |
| 597 --output_dir 'pick_closed_reference_otus' \ | |
| 598 --reference_fp 'test-data/pick_closed_reference_otus/refseqs.fna' \ | |
| 599 --taxonomy_fp 'test-data/pick_closed_reference_otus/taxa.txt' | |
| 600 biom convert \ | |
| 601 -i 'pick_closed_reference_otus/otu_table.biom' \ | |
| 602 -o 'test-data/pick_closed_reference_otus/basic_otu_table.biom' \ | |
| 603 --to-json | |
| 604 | |
| 605 pick_closed_reference_otus.py \ | |
| 606 --input_fp 'test-data/pick_closed_reference_otus/seqs.fna' \ | |
| 607 --output_dir 'pick_closed_reference_otus_sortmerna' \ | |
| 608 --reference_fp 'test-data/pick_closed_reference_otus/refseqs.fna' \ | |
| 609 --taxonomy_fp 'test-data/pick_closed_reference_otus/taxa.txt' \ | |
| 610 --parameter_fp 'test-data/pick_closed_reference_otus/sortmerna_params.txt' | |
| 611 biom convert \ | |
| 612 -i 'pick_closed_reference_otus_sortmerna/otu_table.biom' \ | |
| 613 -o 'test-data/pick_closed_reference_otus/sortmerna_otu_table.biom' \ | |
| 614 --to-json | |
| 615 | |
| 616 pick_closed_reference_otus.py \ | |
| 617 --input_fp 'test-data/pick_closed_reference_otus/seqs.fna' \ | |
| 618 --output_dir 'pick_closed_reference_otus_assign_taxonomy' \ | |
| 619 --reference_fp 'test-data/pick_closed_reference_otus/refseqs.fna' \ | |
| 620 --assign_taxonomy | |
| 621 biom convert \ | |
| 622 -i 'pick_closed_reference_otus_assign_taxonomy/otu_table.biom' \ | |
| 623 -o 'test-data/pick_closed_reference_otus/assign_taxonomy_otu_table.biom' \ | |
| 624 --to-json | |
| 625 | |
| 626 pick_closed_reference_otus.py \ | |
| 627 --input_fp 'test-data/pick_closed_reference_otus/seqs.fna' \ | |
| 628 --output_dir 'pick_closed_reference_otus_suppress_taxonomy_assignment' \ | |
| 629 --reference_fp 'test-data/pick_closed_reference_otus/refseqs.fna' \ | |
| 630 --suppress_taxonomy_assignment | |
| 631 biom convert \ | |
| 632 -i 'pick_closed_reference_otus_suppress_taxonomy_assignment/otu_table.biom' \ | |
| 633 -o 'test-data/pick_closed_reference_otus/suppress_taxonomy_assignment_otu_table.biom' \ | |
| 634 --to-json | |
| 635 | |
| 636 # pick_open_reference_otus | |
| 637 pick_open_reference_otus.py \ | |
| 638 --input_fps 'test-data/pick_open_reference_otus/sequences.fasta' \ | |
| 639 -o pick_open_reference_otus_1 \ | |
| 640 --reference_fp 'test-data/gg_13_8_79_otus.fasta' \ | |
| 641 --otu_picking_method 'uclust' \ | |
| 642 --new_ref_set_id 'New' \ | |
| 643 --parallel \ | |
| 644 --percent_subsample '0.001' \ | |
| 645 --prefilter_percent_id '0.0' \ | |
| 646 --minimum_failure_threshold '100000' \ | |
| 647 --min_otu_size '2' | |
| 648 cp pick_open_reference_otus_1/final_otu_map.txt 'test-data/pick_open_reference_otus/1_final_otu_map.txt' | |
| 649 cp pick_open_reference_otus_1/final_otu_map_mc*.txt 'test-data/pick_open_reference_otus/1_final_otu_map_mc.txt' | |
| 650 cp pick_open_reference_otus_1/rep_set.tre 'test-data/pick_open_reference_otus/1_rep_set_tree.tre' | |
| 651 rm -rf pick_open_reference_otus_1 | |
| 652 | |
| 653 pick_open_reference_otus.py \ | |
| 654 --input_fps 'test-data/pick_open_reference_otus/sequences.fasta' \ | |
| 655 -o pick_open_reference_otus_2 \ | |
| 656 --reference_fp 'test-data/gg_13_8_79_otus.fasta' \ | |
| 657 --otu_picking_method 'uclust' \ | |
| 658 --new_ref_set_id 'New' \ | |
| 659 --parallel \ | |
| 660 --percent_subsample '0.001' \ | |
| 661 --prefilter_percent_id '0.0' \ | |
| 662 --minimum_failure_threshold '100000' \ | |
| 663 --min_otu_size '3' \ | |
| 664 --suppress_taxonomy_assignment \ | |
| 665 --suppress_align_and_tree | |
| 666 cp pick_open_reference_otus_2/final_otu_map.txt 'test-data/pick_open_reference_otus/2_final_otu_map.txt' | |
| 667 cp pick_open_reference_otus_2/final_otu_map_mc*.txt 'test-data/pick_open_reference_otus/2_final_otu_map_mc.txt' | |
| 668 rm -rf pick_open_reference_otus_2 | |
| 669 | |
| 670 pick_open_reference_otus.py \ | |
| 671 --input_fps 'test-data/pick_open_reference_otus/sequences.fasta' \ | |
| 672 -o pick_open_reference_otus_3 \ | |
| 673 --reference_fp 'test-data/gg_13_8_79_otus.fasta' \ | |
| 674 --otu_picking_method 'uclust' \ | |
| 675 --new_ref_set_id 'New' \ | |
| 676 --parallel \ | |
| 677 --percent_subsample '0.001' \ | |
| 678 --prefilter_percent_id '0.0' \ | |
| 679 --minimum_failure_threshold '100000' \ | |
| 680 --min_otu_size '10' \ | |
| 681 --suppress_taxonomy_assignment | |
| 682 cp pick_open_reference_otus_3/final_otu_map.txt 'test-data/pick_open_reference_otus/3_final_otu_map.txt' | |
| 683 cp pick_open_reference_otus_3/final_otu_map_mc*.txt 'test-data/pick_open_reference_otus/3_final_otu_map_mc.txt' | |
| 684 cp pick_open_reference_otus_3/rep_set.tre 'test-data/pick_open_reference_otus/3_rep_set_tree.tre' | |
| 685 rm -rf pick_open_reference_otus_3 | |
| 686 | |
| 687 # pick_otus | |
| 688 pick_otus.py \ | |
| 689 -i 'test-data/pick_otus/seqs.fna' \ | |
| 690 -o 'pick_otus_uclust' \ | |
| 691 --otu_picking_method 'uclust' \ | |
| 692 --similarity "0.97" \ | |
| 693 --denovo_otu_id_prefix "denovo" \ | |
| 694 --max_accepts "1" \ | |
| 695 --max_rejects "8" \ | |
| 696 --stepwords "8" \ | |
| 697 --word_length "8" \ | |
| 698 --non_chimeras_retention "union" | |
| 699 | |
| 700 pick_otus.py \ | |
| 701 -i 'test-data/pick_otus/seqs.fna' \ | |
| 702 -o 'pick_otus_sortmerna' \ | |
| 703 --otu_picking_method "sortmerna" \ | |
| 704 --refseqs_fp "test-data/pick_otus/refseqs.fasta" \ | |
| 705 --sortmerna_e_value "1" \ | |
| 706 --sortmerna_coverage "0.97" \ | |
| 707 --sortmerna_tabular \ | |
| 708 --sortmerna_best_N_alignments "1" \ | |
| 709 --sortmerna_max_pos "10000" \ | |
| 710 --similarity "0.97" \ | |
| 711 --non_chimeras_retention "union" | |
| 712 | |
| 713 #pick_otus.py \ | |
| 714 # -i 'test-data/pick_otus/seqs.fna' \ | |
| 715 # -o 'pick_otus_mothur' \ | |
| 716 # --otu_picking_method "mothur" \ | |
| 717 # --clustering_algorithm "furthest" \ | |
| 718 # --non_chimeras_retention "union" | |
| 719 | |
| 720 pick_otus.py \ | |
| 721 -i 'test-data/pick_otus/seqs.fna' \ | |
| 722 -o 'pick_otus_trie' \ | |
| 723 --otu_picking_method "trie" \ | |
| 724 --non_chimeras_retention "union" | |
| 725 | |
| 726 pick_otus.py \ | |
| 727 -i 'test-data/pick_otus/seqs.fna' \ | |
| 728 -o 'pick_otus_uclust_ref' \ | |
| 729 --otu_picking_method "uclust_ref" \ | |
| 730 --refseqs_fp "test-data/pick_otus/refseqs.fasta" \ | |
| 731 --similarity "0.97" \ | |
| 732 --max_accepts "1" \ | |
| 733 --max_rejects "8" \ | |
| 734 --stepwords "8" \ | |
| 735 --word_length "8" \ | |
| 736 --non_chimeras_retention "union" | |
| 737 | |
| 738 #pick_otus.py \ | |
| 739 # -i 'test-data/pick_otus/seqs.fna' \ | |
| 740 # -o 'pick_otus_blast' \ | |
| 741 # --otu_picking_method "blast" \ | |
| 742 # --refseqs_fp "test-data/pick_otus/refseqs.fasta" \ | |
| 743 # --similarity "0.97" \ | |
| 744 # --max_e_value_blast "1e-10" \ | |
| 745 # --min_aligned_percent "0.5" \ | |
| 746 # --non_chimeras_retention "union" | |
| 747 | |
| 748 # pick_otus.py \ | |
| 749 # -i 'test-data/pick_otus/seqs.fna' \ | |
| 750 # -o 'pick_otus_sumaclust' \ | |
| 751 # --otu_picking_method "sumaclust" \ | |
| 752 # --similarity "0.97" \ | |
| 753 # --sumaclust_l \ | |
| 754 # --denovo_otu_id_prefix "denovo" \ | |
| 755 # --non_chimeras_retention "union" | |
| 756 | |
| 757 pick_otus.py \ | |
| 758 -i 'test-data/pick_otus/seqs.fna' \ | |
| 759 -o 'pick_otus_swarm' \ | |
| 760 --otu_picking_method "swarm" \ | |
| 761 --denovo_otu_id_prefix "denovo" \ | |
| 762 --swarm_resolution "1" \ | |
| 763 --non_chimeras_retention "union" | |
| 764 | |
| 765 pick_otus.py \ | |
| 766 -i 'test-data/pick_otus/seqs.fna' \ | |
| 767 -o 'pick_otus_prefix_suffix' \ | |
| 768 --otu_picking_method "prefix_suffix" \ | |
| 769 --prefix_length "50" \ | |
| 770 --suffix_length "50" \ | |
| 771 --non_chimeras_retention "union" | |
| 772 | |
| 773 pick_otus.py \ | |
| 774 -i 'test-data/pick_otus/seqs.fna' \ | |
| 775 -o 'pick_otus_cdhit' \ | |
| 776 --otu_picking_method "cdhit" \ | |
| 777 --similarity "0.97" \ | |
| 778 --non_chimeras_retention "union" | |
| 779 | |
| 780 pick_otus.py \ | |
| 781 -i 'test-data/pick_otus/seqs.fna' \ | |
| 782 -o 'pick_otus_uclust_intersection' \ | |
| 783 --otu_picking_method "uclust" \ | |
| 784 --similarity "0.97" \ | |
| 785 --denovo_otu_id_prefix "denovo" \ | |
| 786 --max_accepts "1" \ | |
| 787 --max_rejects "8" \ | |
| 788 --stepwords "8" \ | |
| 789 --word_length "8" \ | |
| 790 --non_chimeras_retention "intersection" | |
| 791 | |
| 792 # pick_rep_set | |
| 793 pick_rep_set.py \ | |
| 794 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
| 795 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
| 796 --rep_set_picking_method 'first' \ | |
| 797 --sort_by 'otu' \ | |
| 798 --result_fp 'test-data/pick_rep_set/first_otu_fasta.fasta' \ | |
| 799 --log_fp 'test-data/pick_rep_set/first_otu_fasta.txt' | |
| 800 | |
| 801 pick_rep_set.py \ | |
| 802 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
| 803 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
| 804 --reference_seqs_fp 'test-data/pick_rep_set/refseqs.fasta' \ | |
| 805 --rep_set_picking_method 'first' \ | |
| 806 --sort_by 'otu' \ | |
| 807 --result_fp 'test-data/pick_rep_set/first_otu_fasta_ref.fasta' \ | |
| 808 --log_fp 'test-data/pick_rep_set/first_otu_fasta_ref.txt' | |
| 809 | |
| 810 pick_rep_set.py \ | |
| 811 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
| 812 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
| 813 --rep_set_picking_method 'longest' \ | |
| 814 --sort_by 'otu' \ | |
| 815 --result_fp 'test-data/pick_rep_set/longest_otu_fasta.fasta' \ | |
| 816 --log_fp 'test-data/pick_rep_set/longest_otu_fasta.txt' | |
| 817 | |
| 818 pick_rep_set.py \ | |
| 819 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
| 820 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
| 821 --rep_set_picking_method 'most_abundant' \ | |
| 822 --sort_by 'otu' \ | |
| 823 --result_fp 'test-data/pick_rep_set/most_abundant_otu_fasta.fasta' \ | |
| 824 --log_fp 'test-data/pick_rep_set/most_abundant_otu_fasta.txt' | |
| 825 | |
| 826 pick_rep_set.py \ | |
| 827 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
| 828 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
| 829 --rep_set_picking_method 'random' \ | |
| 830 --sort_by 'otu' \ | |
| 831 --result_fp 'test-data/pick_rep_set/random_otu_fasta.fasta' \ | |
| 832 --log_fp 'test-data/pick_rep_set/random_otu_fasta.txt' | |
| 833 | |
| 834 pick_rep_set.py \ | |
| 835 --input_file 'test-data/pick_rep_set/seqs_otus.txt' \ | |
| 836 --fasta_file 'test-data/pick_rep_set/seqs.fna' \ | |
| 837 --rep_set_picking_method 'first' \ | |
| 838 --sort_by 'seq_id' \ | |
| 839 --result_fp 'test-data/pick_rep_set/first_seq_id_fasta.fasta' \ | |
| 840 --log_fp 'test-data/pick_rep_set/first_seq_id_fasta.txt' | |
| 841 | |
| 842 # plot_taxa_summary | |
| 843 plot_taxa_summary.py \ | |
| 844 --counts_fname 'test-data/plot_taxa_summary/phylum.txt' \ | |
| 845 --dir_path 'test-data/plot_taxa_summary/phylum' \ | |
| 846 --labels 'phylum' \ | |
| 847 --num_categories '20' \ | |
| 848 --background_color 'white' \ | |
| 849 --dpi '80' \ | |
| 850 --x_width '12' \ | |
| 851 --y_height '12' \ | |
| 852 --bar_width '0.75' \ | |
| 853 --type_of_file 'png' \ | |
| 854 --chart_type 'area,bar,pie' \ | |
| 855 --resize_nth_label '0' \ | |
| 856 --label_type 'categorical' | |
| 857 | |
| 858 plot_taxa_summary.py \ | |
| 859 --counts_fname 'test-data/plot_taxa_summary/phylum.txt,test-data/plot_taxa_summary/class.txt,test-data/plot_taxa_summary/genus.txt' \ | |
| 860 --dir_path 'test-data/plot_taxa_summary/phylum_class_genus' \ | |
| 861 --labels 'Phylum,Class,Genus' \ | |
| 862 --num_categories '20' \ | |
| 863 --background_color 'white' \ | |
| 864 --dpi '80' \ | |
| 865 --x_width '12' \ | |
| 866 --y_height '12' \ | |
| 867 --bar_width '0.75' \ | |
| 868 --type_of_file 'png' \ | |
| 869 --chart_type 'area,bar,pie' \ | |
| 870 --resize_nth_label '0' \ | |
| 871 --label_type 'categorical' | |
| 872 | |
| 873 plot_taxa_summary.py \ | |
| 874 --counts_fname 'test-data/plot_taxa_summary/class.txt' \ | |
| 875 --dir_path 'test-data/plot_taxa_summary/class' \ | |
| 876 --labels 'Class' \ | |
| 877 --num_categories '10' \ | |
| 878 --background_color 'white' \ | |
| 879 --dpi '80' \ | |
| 880 --x_width '12' \ | |
| 881 --y_height '12' \ | |
| 882 --bar_width '0.75' \ | |
| 883 --chart_type 'pie' \ | |
| 884 --type_of_file 'svg' \ | |
| 885 --include_html_legend \ | |
| 886 --resize_nth_label '0' \ | |
| 887 --label_type 'categorical' | |
| 888 | |
| 889 plot_taxa_summary.py \ | |
| 890 --counts_fname 'test-data/plot_taxa_summary/class.txt' \ | |
| 891 --dir_path 'test-data/plot_taxa_summary/class_colorby' \ | |
| 892 --labels 'Class' \ | |
| 893 --num_categories '20' \ | |
| 894 --colorby 'PC.636,PC.635' \ | |
| 895 --background_color 'white' \ | |
| 896 --dpi '80' \ | |
| 897 --x_width '12' \ | |
| 898 --y_height '12' \ | |
| 899 --bar_width '0.75' \ | |
| 900 --type_of_file 'pdf' \ | |
| 901 --chart_type 'area,bar,pie' \ | |
| 902 --resize_nth_label '0' \ | |
| 903 --label_type 'categorical' | |
| 904 | |
| 905 # split_libraries | |
| 906 split_libraries.py \ | |
| 907 --map 'test-data/split_libraries/mapping_file.txt' \ | |
| 908 -o split_libraries \ | |
| 909 --fasta 'test-data/split_libraries/reads_1.fna,test-data/split_libraries/reads_2.fna' \ | |
| 910 --qual 'test-data/split_libraries/reads_1.qual,test-data/split_libraries/reads_2.qual' \ | |
| 911 --min_qual_score 25 \ | |
| 912 --qual_score_window 0 \ | |
| 913 --record_qual_scores \ | |
| 914 --min_seq_length 200 \ | |
| 915 --max_seq_length 1000 \ | |
| 916 --max_ambig 6 \ | |
| 917 --max_homopolymer 6 \ | |
| 918 --max_primer_mismatch 0 \ | |
| 919 --barcode_type 'golay_12' \ | |
| 920 --max_barcode_errors 1.5 \ | |
| 921 --start_numbering_at 1 | |
| 922 cp split_libraries/seqs.fna 'test-data/split_libraries/seqs.fna' | |
| 923 cp split_libraries/split_library_log.txt 'test-data/split_libraries/split_library_log' | |
| 924 cp split_libraries/histograms.txt 'test-data/split_libraries/histograms.txt' | |
| 925 cp split_libraries/seqs_filtered.qual 'test-data/split_libraries/seqs_filtered.qual' | |
| 926 rm -rf split_libraries | |
| 927 | |
| 928 # split_libraries_fastq | |
| 929 split_libraries_fastq.py \ | |
| 930 --sequence_read_fps 'test-data/split_libraries_fastq/forward_reads.fastq' \ | |
| 931 -o split_libraries \ | |
| 932 --mapping_fps 'test-data/map.tsv' \ | |
| 933 --barcode_read_fps 'test-data/split_libraries_fastq/barcodes.fastq' \ | |
| 934 --store_qual_scores \ | |
| 935 --store_demultiplexed_fastq \ | |
| 936 --max_bad_run_length 3 \ | |
| 937 --min_per_read_length_fraction 0.75 \ | |
| 938 --sequence_max_n 0 \ | |
| 939 --start_seq_id 0 \ | |
| 940 --barcode_type 'golay_12' \ | |
| 941 --max_barcode_errors 1.5 | |
| 942 cp split_libraries/histograms.txt 'test-data/split_libraries_fastq/histograms.tabular' | |
| 943 cp split_libraries/seqs.fna 'test-data/split_libraries_fastq/sequences.fasta' | |
| 944 cp split_libraries/seqs.qual 'test-data/split_libraries_fastq/sequence_qualities.qual' | |
| 945 cp split_libraries/seqs.fastq 'test-data/split_libraries_fastq/demultiplexed_sequences.fastq' | |
| 946 rm -rf split_libraries | |
| 947 | |
| 948 # summarize_taxa | |
| 949 cp 'test-data/core_diversity_analyses/otu_table.biom' 'test-data/summarize_taxa/otu_table.biom' | |
| 950 cp 'test-data/core_diversity_analyses/map.txt' 'test-data/summarize_taxa/map.txt' | |
| 951 | |
| 952 summarize_taxa.py \ | |
| 953 -i 'test-data/summarize_taxa/otu_table.biom' \ | |
| 954 -o summarize_taxa_1 \ | |
| 955 -L '2,3,4,5,6' \ | |
| 956 -m 'test-data/summarize_taxa/map.txt' \ | |
| 957 --md_identifier "taxonomy" \ | |
| 958 --delimiter ";" | |
| 959 cp summarize_taxa_1/*_L2.txt "test-data/summarize_taxa/1_L2.txt" | |
| 960 cp summarize_taxa_1/*_L3.txt "test-data/summarize_taxa/1_L3.txt" | |
| 961 cp summarize_taxa_1/*_L4.txt "test-data/summarize_taxa/1_L4.txt" | |
| 962 cp summarize_taxa_1/*_L5.txt "test-data/summarize_taxa/1_L5.txt" | |
| 963 cp summarize_taxa_1/*_L6.txt "test-data/summarize_taxa/1_L6.txt" | |
| 964 rm -rf summarize_taxa_1 | |
| 965 | |
| 966 summarize_taxa.py \ | |
| 967 -i 'test-data/summarize_taxa/otu_table.biom' \ | |
| 968 -o summarize_taxa_2 \ | |
| 969 -L '3,6' \ | |
| 970 --md_identifier "taxonomy" \ | |
| 971 --delimiter ";" | |
| 972 cp summarize_taxa_2/*_L3.txt "test-data/summarize_taxa/2_L3.txt" | |
| 973 cp summarize_taxa_2/*_L6.txt "test-data/summarize_taxa/2_L6.txt" | |
| 974 rm -rf summarize_taxa_2 | |
| 975 | |
| 976 # summarize_taxa_through_plots | |
| 977 summarize_taxa_through_plots.py \ | |
| 978 --otu_table_fp 'test-data/summarize_taxa_through_plots/otu_table.biom' \ | |
| 979 --output_dir summarize_taxa_through_plots_mapping \ | |
| 980 --mapping_fp 'test-data/summarize_taxa_through_plots/Fasting_Map.txt' | |
| 981 biom convert \ | |
| 982 -i 'summarize_taxa_through_plots_mapping/otu_table_L2.biom' \ | |
| 983 -o 'summarize_taxa_through_plots_mapping/otu_table_L2_json.biom' \ | |
| 984 --to-json | |
| 985 biom convert \ | |
| 986 -i 'summarize_taxa_through_plots_mapping/otu_table_L3.biom' \ | |
| 987 -o 'summarize_taxa_through_plots_mapping/otu_table_L3_json.biom' \ | |
| 988 --to-json | |
| 989 biom convert \ | |
| 990 -i 'summarize_taxa_through_plots_mapping/otu_table_L4.biom' \ | |
| 991 -o 'summarize_taxa_through_plots_mapping/otu_table_L4_json.biom' \ | |
| 992 --to-json | |
| 993 biom convert \ | |
| 994 -i 'summarize_taxa_through_plots_mapping/otu_table_L5.biom' \ | |
| 995 -o 'summarize_taxa_through_plots_mapping/otu_table_L5_json.biom' \ | |
| 996 --to-json | |
| 997 biom convert \ | |
| 998 -i 'summarize_taxa_through_plots_mapping/otu_table_L6.biom' \ | |
| 999 -o 'summarize_taxa_through_plots_mapping/otu_table_L6_json.biom' \ | |
| 1000 --to-json | |
| 1001 cp summarize_taxa_through_plots_mapping/*.txt test-data/summarize_taxa_through_plots/mapping/ | |
| 1002 cp summarize_taxa_through_plots_mapping/*_json.biom test-data/summarize_taxa_through_plots/mapping/ | |
| 1003 cp summarize_taxa_through_plots_mapping/taxa_summary_plots/area_charts.html 'test-data/summarize_taxa_through_plots/mapping/area_charts.html' | |
| 1004 cp summarize_taxa_through_plots_mapping/taxa_summary_plots/bar_charts.html 'test-data/summarize_taxa_through_plots/mapping/bar_charts.html' | |
| 1005 | |
| 1006 summarize_taxa_through_plots.py \ | |
| 1007 --otu_table_fp 'test-data/summarize_taxa_through_plots/otu_table.biom' \ | |
| 1008 --output_dir summarize_taxa_through_plots_mapping_categories \ | |
| 1009 --mapping_fp 'test-data/summarize_taxa_through_plots/Fasting_Map.txt' \ | |
| 1010 --mapping_category 'Treatment' | |
| 1011 biom convert \ | |
| 1012 -i 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L2.biom' \ | |
| 1013 -o 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L2_json.biom' \ | |
| 1014 --to-json | |
| 1015 biom convert \ | |
| 1016 -i 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L3.biom' \ | |
| 1017 -o 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L3_json.biom' \ | |
| 1018 --to-json | |
| 1019 biom convert \ | |
| 1020 -i 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L4.biom' \ | |
| 1021 -o 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L4_json.biom' \ | |
| 1022 --to-json | |
| 1023 biom convert \ | |
| 1024 -i 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L5.biom' \ | |
| 1025 -o 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L5_json.biom' \ | |
| 1026 --to-json | |
| 1027 biom convert \ | |
| 1028 -i 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L6.biom' \ | |
| 1029 -o 'summarize_taxa_through_plots_mapping_categories/Treatment_otu_table_L6_json.biom' \ | |
| 1030 --to-json | |
| 1031 cp summarize_taxa_through_plots_mapping_categories/*.txt test-data/summarize_taxa_through_plots/mapping_categories/ | |
| 1032 cp summarize_taxa_through_plots_mapping_categories/*_json.biom test-data/summarize_taxa_through_plots/mapping_categories/ | |
| 1033 cp summarize_taxa_through_plots_mapping_categories/taxa_summary_plots/area_charts.html 'test-data/summarize_taxa_through_plots/mapping_categories/area_charts.html' | |
| 1034 cp summarize_taxa_through_plots_mapping_categories/taxa_summary_plots/bar_charts.html 'test-data/summarize_taxa_through_plots/mapping_categories/bar_charts.html' | |
| 1035 | |
| 1036 summarize_taxa_through_plots.py \ | |
| 1037 --otu_table_fp 'test-data/summarize_taxa_through_plots/otu_table.biom' \ | |
| 1038 --output_dir summarize_taxa_through_plots_mapping_sort \ | |
| 1039 --mapping_fp 'test-data/summarize_taxa_through_plots/Fasting_Map.txt' \ | |
| 1040 --sort | |
| 1041 biom convert \ | |
| 1042 -i 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L2.biom' \ | |
| 1043 -o 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L2_json.biom' \ | |
| 1044 --to-json | |
| 1045 biom convert \ | |
| 1046 -i 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L3.biom' \ | |
| 1047 -o 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L3_json.biom' \ | |
| 1048 --to-json | |
| 1049 biom convert \ | |
| 1050 -i 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L4.biom' \ | |
| 1051 -o 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L4_json.biom' \ | |
| 1052 --to-json | |
| 1053 biom convert \ | |
| 1054 -i 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L5.biom' \ | |
| 1055 -o 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L5_json.biom' \ | |
| 1056 --to-json | |
| 1057 biom convert \ | |
| 1058 -i 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L6.biom' \ | |
| 1059 -o 'summarize_taxa_through_plots_mapping_sort/otu_table_sorted_L6_json.biom' \ | |
| 1060 --to-json | |
| 1061 cp summarize_taxa_through_plots_mapping_sort/*.txt test-data/summarize_taxa_through_plots/mapping_sort/ | |
| 1062 cp summarize_taxa_through_plots_mapping_sort/*_json.biom test-data/summarize_taxa_through_plots/mapping_sort/ | |
| 1063 cp summarize_taxa_through_plots_mapping_sort/taxa_summary_plots/area_charts.html 'test-data/summarize_taxa_through_plots/mapping_sort/area_charts.html' | |
| 1064 cp summarize_taxa_through_plots_mapping_sort/taxa_summary_plots/bar_charts.html 'test-data/summarize_taxa_through_plots/mapping_sort/bar_charts.html' | |
| 1065 | |
| 1066 summarize_taxa_through_plots.py \ | |
| 1067 --otu_table_fp 'test-data/summarize_taxa_through_plots/otu_table.biom' \ | |
| 1068 --output_dir summarize_taxa_through_plots_without_mapping | |
| 1069 biom convert \ | |
| 1070 -i 'summarize_taxa_through_plots_without_mapping/otu_table_L2.biom' \ | |
| 1071 -o 'summarize_taxa_through_plots_without_mapping/otu_table_L2_json.biom' \ | |
| 1072 --to-json | |
| 1073 biom convert \ | |
| 1074 -i 'summarize_taxa_through_plots_without_mapping/otu_table_L3.biom' \ | |
| 1075 -o 'summarize_taxa_through_plots_without_mapping/otu_table_L3_json.biom' \ | |
| 1076 --to-json | |
| 1077 biom convert \ | |
| 1078 -i 'summarize_taxa_through_plots_without_mapping/otu_table_L4.biom' \ | |
| 1079 -o 'summarize_taxa_through_plots_without_mapping/otu_table_L4_json.biom' \ | |
| 1080 --to-json | |
| 1081 biom convert \ | |
| 1082 -i 'summarize_taxa_through_plots_without_mapping/otu_table_L5.biom' \ | |
| 1083 -o 'summarize_taxa_through_plots_without_mapping/otu_table_L5_json.biom' \ | |
| 1084 --to-json | |
| 1085 biom convert \ | |
| 1086 -i 'summarize_taxa_through_plots_without_mapping/otu_table_L6.biom' \ | |
| 1087 -o 'summarize_taxa_through_plots_without_mapping/otu_table_L6_json.biom' \ | |
| 1088 --to-json | |
| 1089 cp summarize_taxa_through_plots_without_mapping/*.txt test-data/summarize_taxa_through_plots/without_mapping/ | |
| 1090 cp summarize_taxa_through_plots_without_mapping/*_json.biom test-data/summarize_taxa_through_plots/without_mapping/ | |
| 1091 cp summarize_taxa_through_plots_without_mapping/taxa_summary_plots/area_charts.html 'test-data/summarize_taxa_through_plots/without_mapping/area_charts.html' | |
| 1092 cp summarize_taxa_through_plots_without_mapping/taxa_summary_plots/bar_charts.html 'test-data/summarize_taxa_through_plots/without_mapping/bar_charts.html' | |
| 1093 | |
| 1094 # upgma_cluster | |
| 1095 upgma_cluster.py \ | |
| 1096 --input_path 'test-data/upgma_cluster/' \ | |
| 1097 --output_path 'test-data/upgma_cluster/' | |
| 1098 | |
| 1099 # validate_mapping_file | |
| 1100 validate_mapping_file.py \ | |
| 1101 -m 'test-data/validate_mapping_file/map.tsv' \ | |
| 1102 -o validate_mapping_file_output \ | |
| 1103 -c '_' | |
| 1104 cp validate_mapping_file_output/*.html 'test-data/validate_mapping_file/map.tsv.html' | |
| 1105 cp validate_mapping_file_output/*.log 'test-data/validate_mapping_file/map.tsv.log' | |
| 1106 cp validate_mapping_file_output/*corrected.txt 'test-data/validate_mapping_file/map.tsv_corrected.txt' | |
| 1107 rm -rf validate_mapping_file_output | |
| 1108 | |
| 1109 | |
| 1110 | |
| 1111 | |
| 1112 | |
| 1113 | |
| 1114 | |
| 1115 | |
| 1116 | |
| 1117 | |
| 1118 | |
| 1119 | |
| 1120 | |
| 1121 | |
| 1122 | |
| 1123 | |
| 1124 | |
| 1125 | |
| 1126 | 
