# HG changeset patch # User jackcurragh # Date 1648039895 0 # Node ID 5bdc8418c3785825307c28dcc82ddcf250316c81 Uploaded diff -r 000000000000 -r 5bdc8418c378 samtools_index/macros.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/samtools_index/macros.xml Wed Mar 23 12:51:35 2022 +0000 @@ -0,0 +1,223 @@ + + + + samtools + + + + 1.13 + 20.05 + + + + + + + + + @HELP@ + + + + + + + + + + + + + + + + + + + + + + @HELP@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + ^[^\s'\":]+(:\d+(-\d+){0,1}){0,1}$ + + + + + + + + + + + + + @misc{SAM_def, + title={Definition of SAM/BAM format}, + url = {https://samtools.github.io/hts-specs/},} + + 10.1093/bioinformatics/btp352 + 10.1093/bioinformatics/btr076 + 10.1093/bioinformatics/btr509 + + @misc{Danecek_et_al, + Author={Danecek, P., Schiffels, S., Durbin, R.}, + title={Multiallelic calling model in bcftools (-m)}, + url = {http://samtools.github.io/bcftools/call-m.pdf},} + + + @misc{Durbin_VCQC, + Author={Durbin, R.}, + title={Segregation based metric for variant call QC}, + url = {http://samtools.github.io/bcftools/rd-SegBias.pdf},} + + + @misc{Li_SamMath, + Author={Li, H.}, + title={Mathematical Notes on SAMtools Algorithms}, + url = {http://www.broadinstitute.org/gatk/media/docs/Samtools.pdf},} + + + @misc{SamTools_github, + title={SAMTools GitHub page}, + url = {https://github.com/samtools/samtools},} + + + + + &1 | grep Version]]> + + + + + + + diff -r 000000000000 -r 5bdc8418c378 samtools_index/samtools_index.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/samtools_index/samtools_index.xml Wed Mar 23 12:51:35 2022 +0000 @@ -0,0 +1,51 @@ + + order of storing aligned sequences + + macros.xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +**What it does** + +Indexes a BAM file + + + diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/1.bam Binary file samtools_index/test-data/1.bam has changed diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/1.bam.bai Binary file samtools_index/test-data/1.bam.bai has changed diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/1_sort.bam Binary file samtools_index/test-data/1_sort.bam has changed diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/1_sort_read_names.bam Binary file samtools_index/test-data/1_sort_read_names.bam has changed diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/minhash.expected.bam Binary file samtools_index/test-data/minhash.expected.bam has changed diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/name.sort.expected.bam Binary file samtools_index/test-data/name.sort.expected.bam has changed diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/name.sort.expected.sam --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/samtools_index/test-data/name.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000 @@ -0,0 +1,28 @@ +@HD VN:1.4 SO:queryname +@SQ SN:insert LN:599 +@SQ SN:ref1 LN:45 +@SQ SN:ref2 LN:40 +@SQ SN:ref3 LN:4 +@RG ID:fish PG:donkey +@RG ID:cow PU:13_&^&&*(:332 +@RG PU:*9u8jkjjkjd: ID:colt +@PG ID:bull PP:donkey +@PG ID:donkey +@PG ID:moose +@PG PP:moose ID:cow +@CO +r000 99 insert 50 30 10M = 80 30 ATTTAGCTAC AAAAAAAAAA RG:Z:cow PG:Z:bull +r000 211 insert 80 30 10M = 50 -30 CCCAATCATT AAAAAAAAAA RG:Z:cow PG:Z:bull +r001 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:fish PG:Z:colt +r001 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:fish PG:Z:colt +r002 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 PG:Z:colt +r003 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:cow +r003 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:cow PG:Z:colt +r004 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:colt +u1 4 * 0 30 23M * 0 0 TAATTAAGTCTACAGAAAAAAAA ??????????????????????? +x1 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:colt PG:Z:bull +x2 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:colt PG:Z:bull +x3 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:fish PG:Z:bull +x4 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:fish PG:Z:bull +x5 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:fish PG:Z:bull +x6 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/pos.sort.expected.bam Binary file samtools_index/test-data/pos.sort.expected.bam has changed diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/pos.sort.expected.sam --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/samtools_index/test-data/pos.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000 @@ -0,0 +1,28 @@ +@HD VN:1.4 SO:coordinate +@SQ SN:insert LN:599 +@SQ SN:ref1 LN:45 +@SQ SN:ref2 LN:40 +@SQ SN:ref3 LN:4 +@RG ID:fish PG:donkey +@RG ID:cow PU:13_&^&&*(:332 +@RG PU:*9u8jkjjkjd: ID:colt +@PG ID:bull PP:donkey +@PG ID:donkey +@PG ID:moose +@PG PP:moose ID:cow +@CO +r000 99 insert 50 30 10M = 80 30 ATTTAGCTAC AAAAAAAAAA RG:Z:cow PG:Z:bull +r000 211 insert 80 30 10M = 50 -30 CCCAATCATT AAAAAAAAAA RG:Z:cow PG:Z:bull +r001 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:fish PG:Z:colt +r002 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 PG:Z:colt +r003 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:cow +r004 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:colt +r003 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:cow PG:Z:colt +r001 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:fish PG:Z:colt +x1 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:colt PG:Z:bull +x2 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:colt PG:Z:bull +x3 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:fish PG:Z:bull +x4 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:fish PG:Z:bull +x5 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:fish PG:Z:bull +x6 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow +u1 4 * 0 30 23M * 0 0 TAATTAAGTCTACAGAAAAAAAA ??????????????????????? diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.as.sort.expected.bam Binary file samtools_index/test-data/tag.as.sort.expected.bam has changed diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.as.sort.expected.sam --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/samtools_index/test-data/tag.as.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000 @@ -0,0 +1,24 @@ +@HD VN:1.4 SO:unknown +@SQ SN:insert LN:599 +@SQ SN:ref1 LN:45 +@SQ SN:ref2 LN:40 +@SQ SN:ref3 LN:4 +@PG ID:llama +@RG ID:fish PG:llama +@RG ID:cow PU:13_&^&&*(:332 PG:donkey +@RG PU:*9u8jkjjkjd: ID:colt +@PG ID:bull PP:donkey +@PG ID:donkey +@CO Do you know? +r006 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:colt PG:Z:donkey FI:i:3 +x11 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:cow PG:Z:bull FI:Z:a +r007 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:donkey AS:i:-5 FI:f:3.5 +x10 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:cow PG:Z:bull AS:i:0 FI:A:b +r007 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:colt PG:Z:donkey AS:i:1 FI:i:4 +r005 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:colt PG:Z:donkey AS:i:10 FI:i:5 +x8 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:cow PG:Z:bull AS:i:10 FI:f:1.5 +r006 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 RG:Z:colt PG:Z:donkey AS:i:20 FI:f:4.5 +x9 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:cow PG:Z:bull AS:i:20 FI:i:1 +x7 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:cow PG:Z:bull AS:i:50 FI:i:2 +r005 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:colt PG:Z:donkey AS:i:100 FI:f:2.5 +x12 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow PG:Z:bull AS:i:65100 diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.fi.sort.expected.bam Binary file samtools_index/test-data/tag.fi.sort.expected.bam has changed diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.fi.sort.expected.sam --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/samtools_index/test-data/tag.fi.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000 @@ -0,0 +1,24 @@ +@HD VN:1.4 SO:unknown +@SQ SN:insert LN:599 +@SQ SN:ref1 LN:45 +@SQ SN:ref2 LN:40 +@SQ SN:ref3 LN:4 +@PG ID:llama +@RG ID:fish PG:llama +@RG ID:cow PU:13_&^&&*(:332 PG:donkey +@RG PU:*9u8jkjjkjd: ID:colt +@PG ID:bull PP:donkey +@PG ID:donkey +@CO Do you know? +x12 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow PG:Z:bull AS:i:65100 +x10 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:cow PG:Z:bull AS:i:0 FI:A:b +x11 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:cow PG:Z:bull FI:Z:a +x9 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:cow PG:Z:bull AS:i:20 FI:i:1 +x8 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:cow PG:Z:bull AS:i:10 FI:f:1.5 +x7 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:cow PG:Z:bull AS:i:50 FI:i:2 +r005 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:colt PG:Z:donkey AS:i:100 FI:f:2.5 +r006 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:colt PG:Z:donkey FI:i:3 +r007 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:donkey AS:i:-5 FI:f:3.5 +r007 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:colt PG:Z:donkey AS:i:1 FI:i:4 +r006 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 RG:Z:colt PG:Z:donkey AS:i:20 FI:f:4.5 +r005 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:colt PG:Z:donkey AS:i:10 FI:i:5 diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.rg.n.sort.expected.bam Binary file samtools_index/test-data/tag.rg.n.sort.expected.bam has changed diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.rg.n.sort.expected.sam --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/samtools_index/test-data/tag.rg.n.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000 @@ -0,0 +1,28 @@ +@HD VN:1.4 SO:unknown +@SQ SN:insert LN:599 +@SQ SN:ref1 LN:45 +@SQ SN:ref2 LN:40 +@SQ SN:ref3 LN:4 +@RG ID:fish PG:donkey +@RG ID:cow PU:13_&^&&*(:332 +@RG PU:*9u8jkjjkjd: ID:colt +@PG ID:bull PP:donkey +@PG ID:donkey +@PG ID:moose +@PG PP:moose ID:cow +@CO +r002 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 PG:Z:colt +u1 4 * 0 30 23M * 0 0 TAATTAAGTCTACAGAAAAAAAA ??????????????????????? +r004 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:colt +x1 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:colt PG:Z:bull +x2 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:colt PG:Z:bull +r000 99 insert 50 30 10M = 80 30 ATTTAGCTAC AAAAAAAAAA RG:Z:cow PG:Z:bull +r000 211 insert 80 30 10M = 50 -30 CCCAATCATT AAAAAAAAAA RG:Z:cow PG:Z:bull +r003 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:cow +r003 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:cow PG:Z:colt +x6 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow +r001 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:fish PG:Z:colt +r001 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:fish PG:Z:colt +x3 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:fish PG:Z:bull +x4 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:fish PG:Z:bull +x5 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:fish PG:Z:bull diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.rg.sort.expected.bam Binary file samtools_index/test-data/tag.rg.sort.expected.bam has changed diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.rg.sort.expected.sam --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/samtools_index/test-data/tag.rg.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000 @@ -0,0 +1,28 @@ +@HD VN:1.4 SO:unknown +@SQ SN:insert LN:599 +@SQ SN:ref1 LN:45 +@SQ SN:ref2 LN:40 +@SQ SN:ref3 LN:4 +@RG ID:fish PG:donkey +@RG ID:cow PU:13_&^&&*(:332 +@RG PU:*9u8jkjjkjd: ID:colt +@PG ID:bull PP:donkey +@PG ID:donkey +@PG ID:moose +@PG PP:moose ID:cow +@CO +r002 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 PG:Z:colt +u1 4 * 0 30 23M * 0 0 TAATTAAGTCTACAGAAAAAAAA ??????????????????????? +r004 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:colt +x1 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:colt PG:Z:bull +x2 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:colt PG:Z:bull +r000 99 insert 50 30 10M = 80 30 ATTTAGCTAC AAAAAAAAAA RG:Z:cow PG:Z:bull +r000 211 insert 80 30 10M = 50 -30 CCCAATCATT AAAAAAAAAA RG:Z:cow PG:Z:bull +r003 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:cow +r003 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:cow PG:Z:colt +x6 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow +r001 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:fish PG:Z:colt +r001 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:fish PG:Z:colt +x3 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:fish PG:Z:bull +x4 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:fish PG:Z:bull +x5 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:fish PG:Z:bull diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/test_input_1_a.bam Binary file samtools_index/test-data/test_input_1_a.bam has changed