annotate lib/config.pl @ 3:17ce4f3bffa2 default tip

Uploaded
author jesse-erdmann
date Tue, 24 Jan 2012 18:33:41 -0500
parents 1437a2df99c0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
1437a2df99c0 Uploaded
jesse-erdmann
parents:
diff changeset
1 use DBI;
1437a2df99c0 Uploaded
jesse-erdmann
parents:
diff changeset
2
1437a2df99c0 Uploaded
jesse-erdmann
parents:
diff changeset
3 #
1437a2df99c0 Uploaded
jesse-erdmann
parents:
diff changeset
4 # Database stuff
1437a2df99c0 Uploaded
jesse-erdmann
parents:
diff changeset
5 #
1437a2df99c0 Uploaded
jesse-erdmann
parents:
diff changeset
6
1437a2df99c0 Uploaded
jesse-erdmann
parents:
diff changeset
# Connection settings.  Every variable below is deliberately a package
# global (no `my`) so that code loading this file can read it.
#
# NOTE(review): credentials are hard-coded in source control; consider
# moving them to a protected file or the environment.  An alternate account
# ('insertion_larga') used to be listed here in a commented-out line; its
# password has been dropped from this comment.
$db_type     = 'mysql';
$db_name     = 'largaespada_NGS_insertion_test';
$db_username = 'sarvera';
$db_password = 'fn101bcc';

# The host value also carries the DBD::mysql DSN option mysql_local_infile=1;
# it is appended to the DSN verbatim through host=$db_host below.
$db_host     = '127.0.0.1;mysql_local_infile=1';
$data_source = "DBI:$db_type:database=$db_name;host=$db_host";

#
# global values
#
# $proj is appended to table names, which allows multiple active instances
# to be running in the db at the same time.
$proj            = 'merge_science';
$library_percent = '0.0001';

# Thresholds are kept as strings, exactly as originally written.
$CIS_total_pvalue   = '0.05';
$CIS_library_pvalue = '0.05';
$CIS_region_pvalue  = '0.05';

$cocis_threshold = '0.001';

# Shared database handle, opened as soon as this file is loaded.
# RaiseError => 1 makes DBI failures die instead of returning undef;
# AutoCommit => 0 means nothing is committed automatically by DBI.
$dbh = DBI->connect(
    $data_source,
    $db_username,
    $db_password,
    { RaiseError => 1, AutoCommit => 0 },
);
1437a2df99c0 Uploaded
jesse-erdmann
parents:
diff changeset
33
1437a2df99c0 Uploaded
jesse-erdmann
parents:
diff changeset
# resolve_barcodes()
#
# Step 2.1: map the barcodes to the sequences.  Creates the table
# illumina_decoded_$proj by joining barcode_$proj with illumina_raw_$proj on
# "sequence starts with seq" and storing the remainder of the sequence (the
# part after the barcode) as decoded_sequence.
#
# The strip offset used to be hard-coded (7, 11 or 13 for 6-, 10- and
# 12-base barcodes) and had to be edited by hand for each data set.  It is
# now computed per row as char_length(seq) + 1, so barcodes of any length,
# including mixed lengths in one barcode table, are stripped correctly.  For
# 10-base barcodes the result is identical to the previous offset of 11.
#
# Takes no arguments.  Uses the globals $dbh and $proj, and leaves the
# statement handle in the global $sth as before.
# Returns whatever $sth->execute returns; with RaiseError enabled on the
# handle, failures die instead.
sub resolve_barcodes {
    $sth = $dbh->prepare(
        "create table illumina_decoded_$proj "
      . "select library, id, substring(sequence, char_length(seq) + 1) as decoded_sequence "
      . "from barcode_$proj,illumina_raw_$proj "
      . "where sequence like concat(seq,'%')"
    );

    return $sth->execute;
}
1437a2df99c0 Uploaded
jesse-erdmann
parents:
diff changeset
47
1437a2df99c0 Uploaded
jesse-erdmann
parents:
diff changeset
# resolve_IRDR()
#
# Step 2.3: build illumina_without_IRDR_$proj from illumina_decoded_$proj.
# Rows whose decoded_sequence matches a LIKE pattern are kept, tagged with
# type 'good', and the text after the matched prefix is stored as
# insertion_sequence.
#
# This section needs to be optimized for each dataset.  The active
# configuration is the one the original author labelled "lung 454 data":
#   1. create the table from sequences with 5 arbitrary leading characters
#      followed by TGTATGTAAACTTCCGACTTCAACTG (31 chars, so offset 32);
#   2. insert the sequences matching the variant with one fewer 'A',
#      TGTATGTAACTTCCGACTTCAACTG (30 chars, so offset 31).
#
# Alternatives kept from the original commented-out statements, all of the
# "create table" form (offset, pattern):
#   single-pattern variant : 31, 'TTAAGTGTATGTAACTTCCGACTTCAACTG%'
#   illumina data          : 27, 'TGTATGTAAACTTCCGACTTCAACTG%'
#   illumina_2 data        : 30, '___TGTATGTAAACTTCCGACTTCAACTG%'
#   MULV virus             : 26, 'CCAAACCTACAGGTGGGGTCTTTCA%'
#
# Takes no arguments.  Uses the globals $dbh and $proj, and leaves the last
# statement handle in the global $sth.  Returns the result of the final
# $sth->execute.
sub resolve_IRDR {
    # Both statements share the same SELECT; only the substring offset and
    # the LIKE pattern differ.
    my $select_for = sub {
        my ($offset, $pattern) = @_;
        return "select library,id,substring(decoded_sequence,$offset) as insertion_sequence, "
             . "'good' as type from illumina_decoded_$proj "
             . "where decoded_sequence like '$pattern'";
    };

    $sth = $dbh->prepare(
        "create table illumina_without_IRDR_$proj "
      . $select_for->(32, '_____TGTATGTAAACTTCCGACTTCAACTG%')
    );
    $sth->execute;

    $sth = $dbh->prepare(
        "insert into illumina_without_IRDR_$proj "
      . $select_for->(31, '_____TGTATGTAACTTCCGACTTCAACTG%')
    );
    return $sth->execute;
}