# HG changeset patch
# User jackcurragh
# Date 1648039895 0
# Node ID 5bdc8418c3785825307c28dcc82ddcf250316c81
Uploaded
diff -r 000000000000 -r 5bdc8418c378 samtools_index/macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/samtools_index/macros.xml Wed Mar 23 12:51:35 2022 +0000
@@ -0,0 +1,223 @@
+
+
+
+ samtools
+
+
+
+ 1.13
+ 20.05
+
+
+
+
+
+
+
+
+ @HELP@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ @HELP@
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ ^[^\s'\":]+(:\d+(-\d+){0,1}){0,1}$
+
+
+
+
+
+
+
+
+
+
+
+
+ @misc{SAM_def,
+ title={Definition of SAM/BAM format},
+ url = {https://samtools.github.io/hts-specs/},}
+
+ 10.1093/bioinformatics/btp352
+ 10.1093/bioinformatics/btr076
+ 10.1093/bioinformatics/btr509
+
+ @misc{Danecek_et_al,
+ Author={Danecek, P. and Schiffels, S. and Durbin, R.},
+ title={Multiallelic calling model in bcftools (-m)},
+ url = {http://samtools.github.io/bcftools/call-m.pdf},}
+
+
+ @misc{Durbin_VCQC,
+ Author={Durbin, R.},
+ title={Segregation based metric for variant call QC},
+ url = {http://samtools.github.io/bcftools/rd-SegBias.pdf},}
+
+
+ @misc{Li_SamMath,
+ Author={Li, H.},
+ title={Mathematical Notes on SAMtools Algorithms},
+ url = {http://www.broadinstitute.org/gatk/media/docs/Samtools.pdf},}
+
+
+ @misc{SamTools_github,
+ title={SAMTools GitHub page},
+ url = {https://github.com/samtools/samtools},}
+
+
+
+
+ &1 | grep Version]]>
+
+
+
+
+
+
+
diff -r 000000000000 -r 5bdc8418c378 samtools_index/samtools_index.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/samtools_index/samtools_index.xml Wed Mar 23 12:51:35 2022 +0000
@@ -0,0 +1,51 @@
+
+ indexes a BAM file
+
+ macros.xml
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+**What it does**
+
+Indexes a BAM file
+
+
+
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/1.bam
Binary file samtools_index/test-data/1.bam has changed
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/1.bam.bai
Binary file samtools_index/test-data/1.bam.bai has changed
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/1_sort.bam
Binary file samtools_index/test-data/1_sort.bam has changed
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/1_sort_read_names.bam
Binary file samtools_index/test-data/1_sort_read_names.bam has changed
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/minhash.expected.bam
Binary file samtools_index/test-data/minhash.expected.bam has changed
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/name.sort.expected.bam
Binary file samtools_index/test-data/name.sort.expected.bam has changed
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/name.sort.expected.sam
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/samtools_index/test-data/name.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000
@@ -0,0 +1,28 @@
+@HD VN:1.4 SO:queryname
+@SQ SN:insert LN:599
+@SQ SN:ref1 LN:45
+@SQ SN:ref2 LN:40
+@SQ SN:ref3 LN:4
+@RG ID:fish PG:donkey
+@RG ID:cow PU:13_&^&&*(:332
+@RG PU:*9u8jkjjkjd: ID:colt
+@PG ID:bull PP:donkey
+@PG ID:donkey
+@PG ID:moose
+@PG PP:moose ID:cow
+@CO
+r000 99 insert 50 30 10M = 80 30 ATTTAGCTAC AAAAAAAAAA RG:Z:cow PG:Z:bull
+r000 211 insert 80 30 10M = 50 -30 CCCAATCATT AAAAAAAAAA RG:Z:cow PG:Z:bull
+r001 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:fish PG:Z:colt
+r001 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:fish PG:Z:colt
+r002 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 PG:Z:colt
+r003 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:cow
+r003 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:cow PG:Z:colt
+r004 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:colt
+u1 4 * 0 30 23M * 0 0 TAATTAAGTCTACAGAAAAAAAA ???????????????????????
+x1 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:colt PG:Z:bull
+x2 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:colt PG:Z:bull
+x3 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:fish PG:Z:bull
+x4 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:fish PG:Z:bull
+x5 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:fish PG:Z:bull
+x6 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/pos.sort.expected.bam
Binary file samtools_index/test-data/pos.sort.expected.bam has changed
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/pos.sort.expected.sam
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/samtools_index/test-data/pos.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000
@@ -0,0 +1,28 @@
+@HD VN:1.4 SO:coordinate
+@SQ SN:insert LN:599
+@SQ SN:ref1 LN:45
+@SQ SN:ref2 LN:40
+@SQ SN:ref3 LN:4
+@RG ID:fish PG:donkey
+@RG ID:cow PU:13_&^&&*(:332
+@RG PU:*9u8jkjjkjd: ID:colt
+@PG ID:bull PP:donkey
+@PG ID:donkey
+@PG ID:moose
+@PG PP:moose ID:cow
+@CO
+r000 99 insert 50 30 10M = 80 30 ATTTAGCTAC AAAAAAAAAA RG:Z:cow PG:Z:bull
+r000 211 insert 80 30 10M = 50 -30 CCCAATCATT AAAAAAAAAA RG:Z:cow PG:Z:bull
+r001 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:fish PG:Z:colt
+r002 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 PG:Z:colt
+r003 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:cow
+r004 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:colt
+r003 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:cow PG:Z:colt
+r001 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:fish PG:Z:colt
+x1 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:colt PG:Z:bull
+x2 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:colt PG:Z:bull
+x3 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:fish PG:Z:bull
+x4 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:fish PG:Z:bull
+x5 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:fish PG:Z:bull
+x6 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow
+u1 4 * 0 30 23M * 0 0 TAATTAAGTCTACAGAAAAAAAA ???????????????????????
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.as.sort.expected.bam
Binary file samtools_index/test-data/tag.as.sort.expected.bam has changed
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.as.sort.expected.sam
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/samtools_index/test-data/tag.as.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000
@@ -0,0 +1,24 @@
+@HD VN:1.4 SO:unknown
+@SQ SN:insert LN:599
+@SQ SN:ref1 LN:45
+@SQ SN:ref2 LN:40
+@SQ SN:ref3 LN:4
+@PG ID:llama
+@RG ID:fish PG:llama
+@RG ID:cow PU:13_&^&&*(:332 PG:donkey
+@RG PU:*9u8jkjjkjd: ID:colt
+@PG ID:bull PP:donkey
+@PG ID:donkey
+@CO Do you know?
+r006 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:colt PG:Z:donkey FI:i:3
+x11 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:cow PG:Z:bull FI:Z:a
+r007 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:donkey AS:i:-5 FI:f:3.5
+x10 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:cow PG:Z:bull AS:i:0 FI:A:b
+r007 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:colt PG:Z:donkey AS:i:1 FI:i:4
+r005 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:colt PG:Z:donkey AS:i:10 FI:i:5
+x8 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:cow PG:Z:bull AS:i:10 FI:f:1.5
+r006 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 RG:Z:colt PG:Z:donkey AS:i:20 FI:f:4.5
+x9 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:cow PG:Z:bull AS:i:20 FI:i:1
+x7 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:cow PG:Z:bull AS:i:50 FI:i:2
+r005 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:colt PG:Z:donkey AS:i:100 FI:f:2.5
+x12 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow PG:Z:bull AS:i:65100
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.fi.sort.expected.bam
Binary file samtools_index/test-data/tag.fi.sort.expected.bam has changed
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.fi.sort.expected.sam
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/samtools_index/test-data/tag.fi.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000
@@ -0,0 +1,24 @@
+@HD VN:1.4 SO:unknown
+@SQ SN:insert LN:599
+@SQ SN:ref1 LN:45
+@SQ SN:ref2 LN:40
+@SQ SN:ref3 LN:4
+@PG ID:llama
+@RG ID:fish PG:llama
+@RG ID:cow PU:13_&^&&*(:332 PG:donkey
+@RG PU:*9u8jkjjkjd: ID:colt
+@PG ID:bull PP:donkey
+@PG ID:donkey
+@CO Do you know?
+x12 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow PG:Z:bull AS:i:65100
+x10 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:cow PG:Z:bull AS:i:0 FI:A:b
+x11 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:cow PG:Z:bull FI:Z:a
+x9 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:cow PG:Z:bull AS:i:20 FI:i:1
+x8 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:cow PG:Z:bull AS:i:10 FI:f:1.5
+x7 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:cow PG:Z:bull AS:i:50 FI:i:2
+r005 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:colt PG:Z:donkey AS:i:100 FI:f:2.5
+r006 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:colt PG:Z:donkey FI:i:3
+r007 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:donkey AS:i:-5 FI:f:3.5
+r007 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:colt PG:Z:donkey AS:i:1 FI:i:4
+r006 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 RG:Z:colt PG:Z:donkey AS:i:20 FI:f:4.5
+r005 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:colt PG:Z:donkey AS:i:10 FI:i:5
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.rg.n.sort.expected.bam
Binary file samtools_index/test-data/tag.rg.n.sort.expected.bam has changed
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.rg.n.sort.expected.sam
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/samtools_index/test-data/tag.rg.n.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000
@@ -0,0 +1,28 @@
+@HD VN:1.4 SO:unknown
+@SQ SN:insert LN:599
+@SQ SN:ref1 LN:45
+@SQ SN:ref2 LN:40
+@SQ SN:ref3 LN:4
+@RG ID:fish PG:donkey
+@RG ID:cow PU:13_&^&&*(:332
+@RG PU:*9u8jkjjkjd: ID:colt
+@PG ID:bull PP:donkey
+@PG ID:donkey
+@PG ID:moose
+@PG PP:moose ID:cow
+@CO
+r002 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 PG:Z:colt
+u1 4 * 0 30 23M * 0 0 TAATTAAGTCTACAGAAAAAAAA ???????????????????????
+r004 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:colt
+x1 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:colt PG:Z:bull
+x2 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:colt PG:Z:bull
+r000 99 insert 50 30 10M = 80 30 ATTTAGCTAC AAAAAAAAAA RG:Z:cow PG:Z:bull
+r000 211 insert 80 30 10M = 50 -30 CCCAATCATT AAAAAAAAAA RG:Z:cow PG:Z:bull
+r003 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:cow
+r003 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:cow PG:Z:colt
+x6 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow
+r001 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:fish PG:Z:colt
+r001 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:fish PG:Z:colt
+x3 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:fish PG:Z:bull
+x4 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:fish PG:Z:bull
+x5 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:fish PG:Z:bull
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.rg.sort.expected.bam
Binary file samtools_index/test-data/tag.rg.sort.expected.bam has changed
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/tag.rg.sort.expected.sam
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/samtools_index/test-data/tag.rg.sort.expected.sam Wed Mar 23 12:51:35 2022 +0000
@@ -0,0 +1,28 @@
+@HD VN:1.4 SO:unknown
+@SQ SN:insert LN:599
+@SQ SN:ref1 LN:45
+@SQ SN:ref2 LN:40
+@SQ SN:ref3 LN:4
+@RG ID:fish PG:donkey
+@RG ID:cow PU:13_&^&&*(:332
+@RG PU:*9u8jkjjkjd: ID:colt
+@PG ID:bull PP:donkey
+@PG ID:donkey
+@PG ID:moose
+@PG PP:moose ID:cow
+@CO
+r002 0 ref1 9 30 1S2I6M1P1I1P1I4M2I * 0 0 AAAAGATAAGGGATAAA * XA:Z:abc XB:i:-10 PG:Z:colt
+u1 4 * 0 30 23M * 0 0 TAATTAAGTCTACAGAAAAAAAA ???????????????????????
+r004 0 ref1 16 30 6M14N1I5M * 0 0 ATAGCTCTCAGC * RG:Z:colt PG:Z:colt
+x1 0 ref2 1 30 20M * 0 0 AGGTTTTATAAAACAAATAA * RG:Z:colt PG:Z:bull
+x2 0 ref2 2 30 21M * 0 0 GGTTTTATAAAACAAATAATT ????????????????????? RG:Z:colt PG:Z:bull
+r000 99 insert 50 30 10M = 80 30 ATTTAGCTAC AAAAAAAAAA RG:Z:cow PG:Z:bull
+r000 211 insert 80 30 10M = 50 -30 CCCAATCATT AAAAAAAAAA RG:Z:cow PG:Z:bull
+r003 0 ref1 9 30 5H6M * 0 0 AGCTAA * RG:Z:cow
+r003 16 ref1 29 30 6H5M * 0 0 TAGGC * RG:Z:cow PG:Z:colt
+x6 0 ref2 14 30 23M * 0 0 TAATTAAGTCTACAGAGCAACTA ??????????????????????? RG:Z:cow
+r001 163 ref1 7 30 8M4I4M1D3M = 37 39 TTAGATAAAGAGGATACTG * XX:B:S,12561,2,20,112 YY:i:100 RG:Z:fish PG:Z:colt
+r001 83 ref1 37 30 9M = 7 -39 CAGCGCCAT * RG:Z:fish PG:Z:colt
+x3 0 ref2 6 30 9M4I13M * 0 0 TTATAAAACAAATAATTAAGTCTACA ?????????????????????????? RG:Z:fish PG:Z:bull
+x4 0 ref2 10 30 25M * 0 0 CAAATAATTAAGTCTACAGAGCAAC ????????????????????????? RG:Z:fish PG:Z:bull
+x5 0 ref2 12 30 24M * 0 0 AATAATTAAGTCTACAGAGCAACT ???????????????????????? RG:Z:fish PG:Z:bull
diff -r 000000000000 -r 5bdc8418c378 samtools_index/test-data/test_input_1_a.bam
Binary file samtools_index/test-data/test_input_1_a.bam has changed